# Files
# 2025-09-21 02:59:47 +00:00

# 38 lines
# 784 B
# YAML

### model
# Relative paths; the directory they are resolved against is not visible
# in this file (presumably the launch directory - confirm with the loader).
tokenizer: data/tokenizer
model_config_path: model_configs/model_config_small.json

### dataset
# data_path points at a Python file, presumably a dataset loading script.
data_path: data/raw_dataset/VirusComment.py
dataloader_num_workers: 8

### output
output_dir: data/output_models/viruscommentcls_9
overwrite_output_dir: true
run_name: viruscommentcls-training
report_to: tensorboard
logging_steps: 1
save_strategy: epoch

### train
do_train: true
num_train_epochs: 25
# 32 samples per device x 32 accumulation steps = 1024 samples per device
# between optimizer updates (assuming standard accumulation semantics).
per_device_train_batch_size: 32
gradient_accumulation_steps: 32
fp16: true
# Optimizer and learning-rate schedule.
# Keep the decimal point and signed exponent in learning_rate: some
# YAML 1.1 loaders read a form such as 1e-5 as a string, not a float.
optim: adamw_torch
learning_rate: 4.3e-5
lr_scheduler_type: cosine
warmup_ratio: 0.05
# Distributed settings; null presumably defers to the consumer's default
# backend - confirm.
ddp_backend: null
ddp_timeout: 180000000
# Loss selection. The focal_* values presumably only take effect when a
# focal loss_type is chosen - verify against the training script.
loss_type: cross_entropy
focal_alpha: 1.0
focal_gamma: 2.0
label_smoothing: 0.0

### eval
do_eval: true
eval_strategy: steps
# Fractional value: presumably read as a share of total training steps
# rather than an absolute step count - confirm with the consumer.
eval_steps: 0.02
per_device_eval_batch_size: 128