rulm
34 строки · 964.0 Байт
{
    "trainer": {
        "evaluation_strategy": "steps",
        "per_device_train_batch_size": 1,
        "per_device_eval_batch_size": 1,
        "gradient_accumulation_steps": 128,
        "eval_steps": 5,
        "save_steps": 5,
        "logging_steps": 1,
        "learning_rate": 0.0003,
        "num_train_epochs": 3,
        "lr_scheduler_type": "cosine",
        "warmup_steps": 10,
        "fp16": false,
        "bf16": true,
        "torch_compile": false,
        "optim": "adamw_torch"
    },
    "lora": {
        "r": 8,
        "lora_alpha": 16,
        "lora_dropout": 0.25,
        "bias": "none",
        "target_modules": ["q_proj", "v_proj", "k_proj", "o_proj"],
        "task_type": "CAUSAL_LM"
    },
    "load_in_8bit": true,
    "only_target_loss": true,
    "mode": "chat",
    "templates_path": "internal_prompts/saiga_v2.json",
    "model_name": "models/vicuna-13b-v1.5",
    "model_type": "causal",
    "max_tokens_count": 2560
}