1
2
3
4
5
6
7
8
9
10
11
12
13
14
|
- model: TrainingArguments(output_dir=./results, overwrite_output_dir=False, do_train=False,
- do_eval=None, do_predict=False, evaluation_strategy=EvaluationStrategy.NO, prediction_loss_only=False,
- per_device_train_batch_size=16, per_device_eval_batch_size=64, gradient_accumulation_steps=1,
- eval_accumulation_steps=None, learning_rate=5e-05, weight_decay=0.01, adam_beta1=0.9,
- adam_beta2=0.999, adam_epsilon=1e-08, max_grad_norm=1.0, num_train_epochs=3, max_steps=-1,
- lr_scheduler_type=SchedulerType.LINEAR, warmup_steps=500, logging_dir=./logs, logging_first_step=False,
- logging_steps=10, save_steps=500, save_total_limit=None, no_cuda=False, seed=42,
- fp16=False, fp16_opt_level=O1, fp16_backend=auto, local_rank=-1, tpu_num_cores=None,
- tpu_metrics_debug=False, debug=False, dataloader_drop_last=False, eval_steps=10,
- dataloader_num_workers=0, past_index=-1, run_name=./results, disable_tqdm=False,
- remove_unused_columns=True, label_names=None, load_best_model_at_end=False, metric_for_best_model=None,
- greater_is_better=None, ignore_data_skip=False, sharded_ddp=False, deepspeed=None,
- label_smoothing_factor=0.0, adafactor=False, _n_gpu=0)
- model_class: Trainer
|