File tree 1 file changed +5
-5
lines changed
1 file changed +5
-5
lines changed Original file line number Diff line number Diff line change @@ -149,12 +149,12 @@ def load(self):
149
149
def train ():
150
150
args = parse_args ()
151
151
args_dict = {
152
- "model_name_or_path" : 'google/byt5-small ' ,
152
+ "model_name_or_path" : 'Langboat/mengzi-t5-base ' ,
153
153
"max_len" : 128 ,
154
- "output_dir" : os .path .join (args .save_dir , './byt5-small -chinese-correction' ),
154
+ "output_dir" : os .path .join (args .save_dir , './mengzi-t5-base -chinese-correction' ),
155
155
"overwrite_output_dir" : True ,
156
- "per_device_train_batch_size" : 32 ,
157
- "per_device_eval_batch_size" : 32 ,
156
+ "per_device_train_batch_size" : 64 ,
157
+ "per_device_eval_batch_size" : 64 ,
158
158
"gradient_accumulation_steps" : 4 ,
159
159
"learning_rate" : 5e-4 ,
160
160
"warmup_steps" : 250 ,
@@ -166,7 +166,7 @@ def train():
166
166
"do_eval" : True ,
167
167
"fp16" : False ,
168
168
"use_cache" : False ,
169
- "max_steps" : 5000 , # default 5000
169
+ # "max_steps": 5000,
170
170
}
171
171
parser = HfArgumentParser (
172
172
(ModelArguments , DataTrainingArguments , TrainingArguments ))
You can’t perform that action at this time.
0 commit comments