# openprompt
# 69 lines · 1.3 KB
# Dataset selection.
dataset:
  name: super_glue.boolq
  path: null  # dataset in huggingface doesn't need path
# Model (`plm`) selection and its optimizer settings.
# NOTE(review): nesting was reconstructed from a flattened copy of this file;
# confirm that `optimize` and `scheduler` sit at these levels in the
# consumer's schema.
plm:
  model_name: t5
  model_path: t5-large
  optimize:
    freeze_para: true
    lr: 1.0e-5
    weight_decay: 0.0
    scheduler:
      type: null  # left unset
      num_warmup_steps: 500
# Data-loading and truncation settings.
dataloader:
  max_seq_length: 256  # max sequence length
  # The decoder max length to truncate the decoder input sequence if it is
  # an encoder-decoder architecture. Note that it is not equivalent to
  # generation.max_length, which is used merely in the generation phase.
  decoder_max_length: 3
  truncate_method: "head"  # choosing from balanced, head, tail
  decode_from_pad: true
# Training settings.
train:
  batch_size: 8
  gradient_accumulation_steps: 1
  max_grad_norm: 1.0
  num_epochs: null  # left unset; num_training_steps is the value provided
  num_training_steps: 30000
# Batch size for the test split.
test:
  batch_size: 16
# Batch size for the dev split.
dev:
  batch_size: 16
# Which template and verbalizer to use.
# NOTE(review): presumably each value names the same-named top-level
# configuration section — confirm against the consumer.
template: soft_template
verbalizer: manual_verbalizer
# Soft-template settings, including a separate optimizer configuration.
# NOTE(review): nesting was reconstructed from a flattened copy of this file;
# confirm that `optimize` and `scheduler` sit at these levels in the
# consumer's schema.
soft_template:
  choice: 0
  file_path: scripts/SuperGLUE/BoolQ/soft_template.txt
  num_tokens: 20
  initialize_from_vocab: true
  random_range: 0.5
  optimize:
    name: AdamW
    lr: 0.3
    adam_epsilon: 1.0e-8
    scheduler:
      num_warmup_steps: 500
# Manual-verbalizer settings.
manual_verbalizer:
  choice: 0
  file_path: scripts/SuperGLUE/BoolQ/manual_verbalizer.txt
# Runtime environment / device settings.
environment:
  num_gpus: 3
  cuda_visible_devices: null  # left unset
  local_rank: 0
  model_parallel: true
  device_map: null  # left unset
# Learning setting for this experiment.
learning_setting: full