Prompt-Transferability
391 строка · 12.1 Кб
"""Export the selected-epoch task prompt of every trained model directory.

For each sub-directory ``model/<name>`` whose name contains ``NAME_FILTER``
and that has an entry in ``BEST_EPOCH``, this script loads
``model/<name>/<epoch>_task_prompt.pkl`` with ``torch.load``, takes the
``"model"`` entry of the loaded object and writes it with ``torch.save`` to
``task_prompt_emb/<name>/task_prompt``.

Directories that fail any check are skipped; the script never aborts because
one directory is missing a checkpoint.
"""
import os
import shutil  # not used by this script; kept from the original import list
import torch

# Only directories whose name contains this substring are processed.
# The original script switched between model families by editing this
# condition by hand (e.g. "T5", "RobertaLarge", "Small").
NAME_FILTER = "T5Large"

# Hand-picked checkpoint epoch for every known "<dataset>Prompt<model>"
# directory.  Trailing comments reproduce the original author's inline
# annotations verbatim (alternative epochs such as "45", and "#"/"##"/"###"
# flags); their meaning is not documented in the script.
#
# Original author's "Haven't done" notes, kept verbatim:
#   tweet #training (68.XX), ethicsdeontologyPromptT5 (63.8),
#   ethicsjusticePromptT5 (60.XX), QQP (86.6), squadPromptT5 (62.7),
#   nq_openPromptT5, multi_newsPromptT5, samsumPromptT5,
#   MNLI #training, snli #training
BEST_EPOCH = {
    # IMDB
    "IMDBPromptRoberta": 23,
    "IMDBPromptRobertaSmall": 29,
    "IMDBPromptRobertaLarge": 27,
    "IMDBPromptRoberta_label": 40,
    "IMDBPromptBert": 21,
    "IMDBPromptT5": 70,
    "IMDBPromptT5Small": 69,  # 45
    "IMDBPromptT5Large": 60,
    # SST2
    "SST2PromptRoberta": 25,
    "SST2PromptRobertaSmall": 38,
    "SST2PromptRobertaLarge": 26,
    "SST2PromptRoberta_label": 18,
    "SST2PromptBert": 18,
    "SST2PromptT5": 26,
    "SST2PromptT5Small": 17,  # 9
    "SST2PromptT5Large": 36,
    # laptop
    "laptopPromptRoberta": 32,
    "laptopPromptRobertaSmall": 40,
    "laptopPromptRobertaLarge": 93,
    "laptopPromptRoberta_label": 32,
    "laptopPromptBert": 30,
    "laptopPromptT5": 210,
    "laptopPromptT5Small": 229,  # 92
    "laptopPromptT5Large": 499,
    # restaurant
    "restaurantPromptRoberta": 33,
    "restaurantPromptRobertaSmall": 50,
    "restaurantPromptRobertaLarge": 126,
    "restaurantPromptRoberta_label": 32,
    "restaurantPromptBert": 31,
    "restaurantPromptT5": 276,
    "restaurantPromptT5Small": 224,  # 162
    "restaurantPromptT5Large": 100,
    # movierationales
    "movierationalesPromptRoberta": 21,
    "movierationalesPromptRobertaSmall": 31,
    "movierationalesPromptRobertaLarge": 62,
    "movierationalesPromptRoberta_label": 48,
    "movierationalesPromptBert": 24,
    "movierationalesPromptT5": 197,
    "movierationalesPromptT5Small": 373,  # 299
    "movierationalesPromptT5Large": 100,
    # tweetevalsentiment
    "tweetevalsentimentPromptRoberta": 28,
    "tweetevalsentimentPromptRobertaSmall": 37,
    "tweetevalsentimentPromptRobertaLarge": 54,
    "tweetevalsentimentPromptRoberta_label": 23,
    "tweetevalsentimentPromptBert": 21,
    "tweetevalsentimentPromptT5": 18,
    "tweetevalsentimentPromptT5Small": 32,  # 20 better
    "tweetevalsentimentPromptT5Large": 38,
    # MNLI
    "MNLIPromptRoberta": 44,
    "MNLIPromptRobertaSmall": 13,
    "MNLIPromptRobertaLarge": 10,  # ###
    "MNLIPromptRoberta_label": 30,
    "MNLIPromptBert": 34,
    "MNLIPromptT5": 5,
    "MNLIPromptT5Small": 4,  # ##
    # QNLI
    "QNLIPromptRoberta": 51,
    "QNLIPromptRobertaSmall": 48,
    "QNLIPromptRobertaLarge": 33,  # ###
    "QNLIPromptRoberta_label": 67,
    "QNLIPromptBert": 41,
    "QNLIPromptT5": 30,
    "QNLIPromptT5Small": 11,  # ##
    # WNLI
    "WNLIPromptRoberta": 755,
    "WNLIPromptRoberta_label": 755,
    "WNLIPromptBert": 754,
    # snli
    "snliPromptRoberta": 29,
    "snliPromptRobertaSmall": 9,
    "snliPromptRobertaLarge": 4,  # ###
    "snliPromptRoberta_label": 17,
    "snliPromptBert": 32,
    "snliPromptT5": 2,
    "snliPromptT5Small": 2,  # #
    # RTE
    "RTEPromptRoberta": 250,
    "RTEPromptRoberta_label": 250,
    "RTEPromptBert": 249,
    # QQP
    "QQPPromptRoberta": 22,
    "QQPPromptRobertaSmall": 17,
    "QQPPromptRobertaLarge": 8,  # ###
    "QQPPromptRoberta_label": 26,
    "QQPPromptBert": 24,
    "QQPPromptT5": 10,
    "QQPPromptT5Small": 2,  # ###
    # MRPC
    "MRPCPromptRoberta": 66,
    "MRPCPromptRobertaSmall": 53,
    "MRPCPromptRobertaLarge": 96,
    "MRPCPromptRoberta_label": 30,
    "MRPCPromptBert": 27,
    "MRPCPromptT5": 199,
    "MRPCPromptT5Small": 213,
    # recastfactuality
    "recastfactualityPromptRoberta": 21,
    "recastfactualityPromptRoberta_label": 21,
    "recastfactualityPromptBert": 20,
    # recastpuns
    "recastpunsPromptRoberta": 36,
    "recastpunsPromptRoberta_label": 36,
    "recastpunsPromptBert": 35,
    # recastverbcorner
    "recastverbcornerPromptRoberta": 35,
    "recastverbcornerPromptRoberta_label": 35,
    "recastverbcornerPromptBert": 34,
    # recastner
    "recastnerPromptRoberta": 30,
    "recastnerPromptRoberta_label": 18,
    "recastnerPromptBert": 20,
    # recastsentiment
    "recastsentimentPromptRoberta": 58,
    "recastsentimentPromptRoberta_label": 58,
    "recastsentimentPromptBert": 57,
    # recastmegaveridicality
    "recastmegaveridicalityPromptRoberta": 32,
    "recastmegaveridicalityPromptRoberta_label": 32,
    "recastmegaveridicalityPromptBert": 31,
    # ethicscommonsense
    "ethicscommonsensePromptRoberta": 96,
    "ethicscommonsensePromptRoberta_label": 96,
    "ethicscommonsensePromptBert": 95,
    # ethicsdeontology
    "ethicsdeontologyPromptRoberta": 63,
    "ethicsdeontologyPromptRobertaSmall": 61,
    "ethicsdeontologyPromptRobertaLarge": 79,  # 125 ###
    "ethicsdeontologyPromptRoberta_label": 77,
    "ethicsdeontologyPromptBert": 14,
    "ethicsdeontologyPromptT5": 101,
    "ethicsdeontologyPromptT5Small": 52,  # #
    # ethicsjustice
    "ethicsjusticePromptRoberta": 29,
    "ethicsjusticePromptRobertaSmall": 150,
    "ethicsjusticePromptRobertaLarge": 68,  # 127 ###
    "ethicsjusticePromptRoberta_label": 63,
    "ethicsjusticePromptBert": 15,
    "ethicsjusticePromptT5": 141,
    "ethicsjusticePromptT5Small": 48,
    # "ethicsvirtuePromptRoberta": 21,  (disabled in the original script)
    # squad / nq_open / multi_news / samsum
    "squadPromptT5": 23,
    "squadPromptT5Small": 11,  # ##
    "nq_openPromptT5": 15,
    "nq_openPromptT5Small": 11,  # ##
    "multi_newsPromptT5": 21,
    "multi_newsPromptT5Small": 16,  # ##
    "samsumPromptT5": 85,
    "samsumPromptT5Small": 28,  # ###
}

# Every entry under "model/" except those with ".py" in the name.
all_model_prompt = [name for name in os.listdir("model") if ".py" not in name]

for dataset_file in all_model_prompt:
    if NAME_FILTER not in dataset_file:
        continue

    original_dir = f"model/{dataset_file}"
    if not os.path.isdir(original_dir):
        continue

    # Skip directories that contain no "*_task_prompt*" file at all.
    if not any("_task_prompt" in name for name in os.listdir(original_dir)):
        continue

    max_epoch = BEST_EPOCH.get(dataset_file)
    if max_epoch is None:
        print("--------------------")
        print("Did not need to genertate this promt_emb:", dataset_file)
        print("--------------------")
        continue

    checkpoint_path = f"{original_dir}/{max_epoch}_task_prompt.pkl"

    # NOTE(review): torch.load unpickles the file, so this must only be run
    # on checkpoints from a trusted source.
    try:
        # The identity map_location keeps every storage where it was
        # deserialized instead of moving it to the device it was saved from.
        parameters = torch.load(
            checkpoint_path, map_location=lambda storage, loc: storage
        )
        prompt_emb = parameters["model"]
    except Exception as err:
        # Best-effort: a missing or unreadable checkpoint skips this directory
        # only.  Unlike a bare ``except:``, Ctrl-C and SystemExit propagate.
        print(dataset_file, "has no trained task_prompt.pkl at epoch", max_epoch)
        print("  reason:", repr(err))
        continue

    target_dir = f"task_prompt_emb/{dataset_file}"
    # makedirs also creates the "task_prompt_emb" parent on a fresh checkout,
    # where a plain os.mkdir would raise FileNotFoundError.
    os.makedirs(target_dir, exist_ok=True)

    target_path = f"{target_dir}/task_prompt"
    torch.save(prompt_emb, target_path)

    print("Save:", target_path, " Done")