rulm
26 строк · 778.0 Байт
{
    "trainer": {
        "evaluation_strategy": "steps",
        "per_device_train_batch_size": 16,
        "per_device_eval_batch_size": 16,
        "gradient_accumulation_steps": 2,
        "eval_steps": 150,
        "save_steps": 150,
        "logging_steps": 10,
        "learning_rate": 0.00003,
        "num_train_epochs": 3,
        "lr_scheduler_type": "cosine",
        "warmup_steps": 100,
        "fp16": false,
        "bf16": true,
        "gradient_checkpointing": false,
        "torch_compile": false,
        "optim": "adamw_torch",
        "half_precision_backend": "auto",
        "fp16_opt_level": "O2"
    },
    "model_name": "sberbank-ai/ruT5-base",
    "model_type": "seq2seq",
    "max_source_tokens_count": 256,
    "max_target_tokens_count": 256
}