mirror of
https://github.com/huggingface/transformers.git
synced 2025-07-14 01:58:22 +06:00

* Add deebert code
* Add readme of deebert
* Add test for deebert
* Update test for Deebert
* Update DeeBert (README, class names, function refactoring); remove requirements.txt
* Format update
* Update test
* Update readme and model init methods
31 lines
790 B
Bash
Executable File
31 lines
790 B
Bash
Executable File
#!/bin/bash
#
# Runs run_glue_deebert.py in evaluation mode (--do_eval) for one
# model/dataset combination. Edit the configuration variables below to pick
# the model type, model size, GLUE task, and data location.
#
# The model is loaded from, and output is written to, the same directory:
#   ./saved_models/<MODEL_TYPE>-<MODEL_SIZE>/<DATASET>/two_stage

set -euo pipefail

export CUDA_VISIBLE_DEVICES=0

# Root directory holding one sub-directory per dataset; edit for your machine.
PATH_TO_DATA=/h/xinji/projects/GLUE

MODEL_TYPE=bert  # bert or roberta
MODEL_SIZE=base  # base or large
DATASET=MRPC  # SST-2, MRPC, RTE, QNLI, QQP, or MNLI

# NOTE: MODEL_NAME is computed here but is not referenced by the command
# below; it is kept so the script's variables match the original.
MODEL_NAME="${MODEL_TYPE}-${MODEL_SIZE}"
if [[ "${MODEL_TYPE}" == 'bert' ]]; then
  MODEL_NAME="${MODEL_NAME}-uncased"
fi

# Single directory used both as --model_name_or_path and as --output_dir.
MODEL_DIR="./saved_models/${MODEL_TYPE}-${MODEL_SIZE}/${DATASET}/two_stage"

python -u run_glue_deebert.py \
  --model_type "${MODEL_TYPE}" \
  --model_name_or_path "${MODEL_DIR}" \
  --task_name "${DATASET}" \
  --do_eval \
  --do_lower_case \
  --data_dir "${PATH_TO_DATA}/${DATASET}" \
  --output_dir "${MODEL_DIR}" \
  --plot_data_dir ./results/ \
  --max_seq_length 128 \
  --eval_each_highway \
  --eval_highway \
  --overwrite_cache \
  --per_gpu_eval_batch_size=1