Releases: microsoft/ContextualSP
Releases · microsoft/ContextualSP
Pretrained Weights of SParC BERT-based Action Copy Model
{
"best_epoch": 13,
"peak_cpu_memory_MB": 0,
"peak_gpu_0_memory_MB": 1,
"peak_gpu_1_memory_MB": 22815,
"peak_gpu_2_memory_MB": 22671,
"peak_gpu_3_memory_MB": 19426,
"peak_gpu_4_memory_MB": 22798,
"peak_gpu_5_memory_MB": 17284,
"peak_gpu_6_memory_MB": 21951,
"peak_gpu_7_memory_MB": 1,
"training_duration": "11:21:16.976743",
"training_start_epoch": 0,
"training_epochs": 22,
"epoch": 22,
"training_action_exact_match": 0,
"training__action_inter_exact_match": 0,
"training__action_turn_1_exact_match": 0,
"training__action_turn_2_exact_match": 0,
"training__action_turn_3_exact_match": 0,
"training__action_turn_4_exact_match": 0,
"training_sql_exact_match": 0,
"training__sql_inter_exact_match": 0,
"training__sql_turn_1_exact_match": 0,
"training__sql_turn_2_exact_match": 0,
"training__sql_turn_3_exact_match": 0,
"training__sql_turn_4_exact_match": 0,
"training__copy": 0,
"training_info": 0,
"training_loss": 0.19148788920165136,
"training_cpu_memory_MB": 0.0,
"training_gpu_0_memory_MB": 1,
"training_gpu_1_memory_MB": 22325,
"training_gpu_2_memory_MB": 19190,
"training_gpu_3_memory_MB": 19426,
"training_gpu_4_memory_MB": 18642,
"training_gpu_5_memory_MB": 16566,
"training_gpu_6_memory_MB": 19856,
"training_gpu_7_memory_MB": 1,
"validation_action_exact_match": 0.43308395677472983,
"validation__action_inter_exact_match": 0.22037914691943128,
"validation__action_turn_1_exact_match": 0.6255924170616114,
"validation__action_turn_2_exact_match": 0.3909952606635071,
"validation__action_turn_3_exact_match": 0.2962962962962963,
"validation__action_turn_4_exact_match": 0.1348314606741573,
"validation_sql_exact_match": 0.4546965918536991,
"validation__sql_inter_exact_match": 0.25118483412322273,
"validation__sql_turn_1_exact_match": 0.6421800947867299,
"validation__sql_turn_2_exact_match": 0.41706161137440756,
"validation__sql_turn_3_exact_match": 0.3148148148148148,
"validation__sql_turn_4_exact_match": 0.16853932584269662,
"validation__copy": 0,
"validation_info": 0,
"validation_loss": 0.3569193813490231,
"best_validation_action_exact_match": 0.4455527847049044,
"best_validation__action_inter_exact_match": 0.22274881516587677,
"best_validation__action_turn_1_exact_match": 0.6255924170616114,
"best_validation__action_turn_2_exact_match": 0.4052132701421801,
"best_validation__action_turn_3_exact_match": 0.3111111111111111,
"best_validation__action_turn_4_exact_match": 0.19101123595505617,
"best_validation_sql_exact_match": 0.4605153782211139,
"best_validation__sql_inter_exact_match": 0.24407582938388625,
"best_validation__sql_turn_1_exact_match": 0.6374407582938388,
"best_validation__sql_turn_2_exact_match": 0.4218009478672986,
"best_validation__sql_turn_3_exact_match": 0.32222222222222224,
"best_validation__sql_turn_4_exact_match": 0.2247191011235955,
"best_validation__copy": 0,
"best_validation_info": 0,
"best_validation_loss": 0.32762717183953
}
Pretrained Weights of CoSQL Turn Model
{
"best_epoch": 24,
"peak_cpu_memory_MB": 0,
"peak_gpu_0_memory_MB": 1,
"peak_gpu_1_memory_MB": 22815,
"peak_gpu_2_memory_MB": 22671,
"peak_gpu_3_memory_MB": 19422,
"peak_gpu_4_memory_MB": 22974,
"peak_gpu_5_memory_MB": 17284,
"peak_gpu_6_memory_MB": 21951,
"peak_gpu_7_memory_MB": 1,
"training_duration": "6:32:27.738503",
"training_start_epoch": 0,
"training_epochs": 33,
"epoch": 33,
"training_action_exact_match": 0,
"training__action_inter_exact_match": 0,
"training__action_turn_1_exact_match": 0,
"training__action_turn_2_exact_match": 0,
"training__action_turn_3_exact_match": 0,
"training__action_turn_4_exact_match": 0,
"training_sql_exact_match": 0,
"training__sql_inter_exact_match": 0,
"training__sql_turn_1_exact_match": 0,
"training__sql_turn_2_exact_match": 0,
"training__sql_turn_3_exact_match": 0,
"training__sql_turn_4_exact_match": 0,
"training_loss": 0.18920585506216245,
"training_cpu_memory_MB": 0.0,
"training_gpu_0_memory_MB": 1,
"training_gpu_1_memory_MB": 22237,
"training_gpu_2_memory_MB": 19158,
"training_gpu_3_memory_MB": 19422,
"training_gpu_4_memory_MB": 20185,
"training_gpu_5_memory_MB": 17284,
"training_gpu_6_memory_MB": 21951,
"training_gpu_7_memory_MB": 1,
"validation_action_exact_match": 0.29890764647467727,
"validation__action_inter_exact_match": 0.07167235494880546,
"validation__action_turn_1_exact_match": 0.36860068259385664,
"validation__action_turn_2_exact_match": 0.2771929824561403,
"validation__action_turn_3_exact_match": 0.26229508196721313,
"validation__action_turn_4_exact_match": 0.2702702702702703,
"validation_sql_exact_match": 0.29791459781529295,
"validation__sql_inter_exact_match": 0.08191126279863481,
"validation__sql_turn_1_exact_match": 0.378839590443686,
"validation__sql_turn_2_exact_match": 0.2736842105263158,
"validation__sql_turn_3_exact_match": 0.26229508196721313,
"validation__sql_turn_4_exact_match": 0.25405405405405407,
"validation_loss": 0.47665515542030334,
"best_validation_action_exact_match": 0.32075471698113206,
"best_validation__action_inter_exact_match": 0.09215017064846416,
"best_validation__action_turn_1_exact_match": 0.3890784982935154,
"best_validation__action_turn_2_exact_match": 0.2912280701754386,
"best_validation__action_turn_3_exact_match": 0.29098360655737704,
"best_validation__action_turn_4_exact_match": 0.2972972972972973,
"best_validation_sql_exact_match": 0.3187686196623635,
"best_validation__sql_inter_exact_match": 0.09897610921501707,
"best_validation__sql_turn_1_exact_match": 0.3993174061433447,
"best_validation__sql_turn_2_exact_match": 0.28421052631578947,
"best_validation__sql_turn_3_exact_match": 0.28688524590163933,
"best_validation__sql_turn_4_exact_match": 0.2864864864864865,
"best_validation_loss": 0.45512670278549194
}
Pretrained Weights of CoSQL Action Copy Model
{
"best_epoch": 35,
"peak_cpu_memory_MB": 0,
"peak_gpu_0_memory_MB": 1,
"peak_gpu_1_memory_MB": 22811,
"peak_gpu_2_memory_MB": 22671,
"peak_gpu_3_memory_MB": 19426,
"peak_gpu_4_memory_MB": 22798,
"peak_gpu_5_memory_MB": 17286,
"peak_gpu_6_memory_MB": 21951,
"peak_gpu_7_memory_MB": 1,
"training_duration": "12:23:41.284435",
"training_start_epoch": 0,
"training_epochs": 44,
"epoch": 44,
"training_action_exact_match": 0,
"training__action_inter_exact_match": 0,
"training__action_turn_1_exact_match": 0,
"training__action_turn_2_exact_match": 0,
"training__action_turn_3_exact_match": 0,
"training__action_turn_4_exact_match": 0,
"training_sql_exact_match": 0,
"training__sql_inter_exact_match": 0,
"training__sql_turn_1_exact_match": 0,
"training__sql_turn_2_exact_match": 0,
"training__sql_turn_3_exact_match": 0,
"training__sql_turn_4_exact_match": 0,
"training__copy": 0,
"training_info": 0,
"training_loss": 0.17617646926255137,
"training_cpu_memory_MB": 0.0,
"training_gpu_0_memory_MB": 1,
"training_gpu_1_memory_MB": 3,
"training_gpu_2_memory_MB": 1743,
"training_gpu_3_memory_MB": 19426,
"training_gpu_4_memory_MB": 1981,
"training_gpu_5_memory_MB": 16566,
"training_gpu_6_memory_MB": 19858,
"training_gpu_7_memory_MB": 1,
"validation_action_exact_match": 0.30883813306852037,
"validation__action_inter_exact_match": 0.07849829351535836,
"validation__action_turn_1_exact_match": 0.3822525597269625,
"validation__action_turn_2_exact_match": 0.2771929824561403,
"validation__action_turn_3_exact_match": 0.28688524590163933,
"validation__action_turn_4_exact_match": 0.2702702702702703,
"validation_sql_exact_match": 0.3118172790466733,
"validation__sql_inter_exact_match": 0.08532423208191127,
"validation__sql_turn_1_exact_match": 0.3993174061433447,
"validation__sql_turn_2_exact_match": 0.2807017543859649,
"validation__sql_turn_3_exact_match": 0.29098360655737704,
"validation__sql_turn_4_exact_match": 0.24864864864864866,
"validation__copy": 0,
"validation_info": 0,
"validation_loss": 0.42742106318473816,
"best_validation_action_exact_match": 0.323733862959285,
"best_validation__action_inter_exact_match": 0.08191126279863481,
"best_validation__action_turn_1_exact_match": 0.3856655290102389,
"best_validation__action_turn_2_exact_match": 0.3017543859649123,
"best_validation__action_turn_3_exact_match": 0.2786885245901639,
"best_validation__action_turn_4_exact_match": 0.31891891891891894,
"best_validation_sql_exact_match": 0.3227408142999007,
"best_validation__sql_inter_exact_match": 0.08532423208191127,
"best_validation__sql_turn_1_exact_match": 0.40273037542662116,
"best_validation__sql_turn_2_exact_match": 0.2912280701754386,
"best_validation__sql_turn_3_exact_match": 0.2786885245901639,
"best_validation__sql_turn_4_exact_match": 0.3027027027027027,
"best_validation__copy": 0,
"best_validation_info": 0,
"best_validation_loss": 0.40968313813209534
}
Pretrained Weights of CoSQL BERT-based Turn Model
{
"best_epoch": 23,
"peak_cpu_memory_MB": 0,
"peak_gpu_0_memory_MB": 1,
"peak_gpu_1_memory_MB": 3489,
"peak_gpu_2_memory_MB": 16884,
"peak_gpu_3_memory_MB": 16857,
"peak_gpu_4_memory_MB": 16886,
"peak_gpu_5_memory_MB": 16816,
"peak_gpu_6_memory_MB": 20163,
"peak_gpu_7_memory_MB": 19975,
"training_duration": "8:04:29.261273",
"training_start_epoch": 0,
"training_epochs": 32,
"epoch": 32,
"training_action_exact_match": 0,
"training__action_inter_exact_match": 0,
"training__action_turn_1_exact_match": 0,
"training__action_turn_2_exact_match": 0,
"training__action_turn_3_exact_match": 0,
"training__action_turn_4_exact_match": 0,
"training_sql_exact_match": 0,
"training__sql_inter_exact_match": 0,
"training__sql_turn_1_exact_match": 0,
"training__sql_turn_2_exact_match": 0,
"training__sql_turn_3_exact_match": 0,
"training__sql_turn_4_exact_match": 0,
"training_loss": 0.05288350063624136,
"training_cpu_memory_MB": 0.0,
"training_gpu_0_memory_MB": 1,
"training_gpu_1_memory_MB": 1751,
"training_gpu_2_memory_MB": 16884,
"training_gpu_3_memory_MB": 16857,
"training_gpu_4_memory_MB": 16886,
"training_gpu_5_memory_MB": 16816,
"training_gpu_6_memory_MB": 20163,
"training_gpu_7_memory_MB": 2,
"validation_action_exact_match": 0.3843098311817279,
"validation__action_inter_exact_match": 0.12286689419795221,
"validation__action_turn_1_exact_match": 0.48464163822525597,
"validation__action_turn_2_exact_match": 0.35789473684210527,
"validation__action_turn_3_exact_match": 0.3483606557377049,
"validation__action_turn_4_exact_match": 0.31351351351351353,
"validation_sql_exact_match": 0.38828202581926513,
"validation__sql_inter_exact_match": 0.1296928327645051,
"validation__sql_turn_1_exact_match": 0.49829351535836175,
"validation__sql_turn_2_exact_match": 0.3473684210526316,
"validation__sql_turn_3_exact_match": 0.36065573770491804,
"validation__sql_turn_4_exact_match": 0.31351351351351353,
"validation_loss": 0.24153371155261993,
"best_validation_action_exact_match": 0.38927507447864945,
"best_validation__action_inter_exact_match": 0.13651877133105803,
"best_validation__action_turn_1_exact_match": 0.47440273037542663,
"best_validation__action_turn_2_exact_match": 0.38596491228070173,
"best_validation__action_turn_3_exact_match": 0.3442622950819672,
"best_validation__action_turn_4_exact_match": 0.31891891891891894,
"best_validation_sql_exact_match": 0.39225422045680236,
"best_validation__sql_inter_exact_match": 0.14334470989761092,
"best_validation__sql_turn_1_exact_match": 0.4948805460750853,
"best_validation__sql_turn_2_exact_match": 0.3684210526315789,
"best_validation__sql_turn_3_exact_match": 0.36475409836065575,
"best_validation__sql_turn_4_exact_match": 0.3027027027027027,
"best_validation_loss": 0.20682337880134583
}
Pretrained Weights of CoSQL BERT-based Action Copy Model
{
"best_epoch": 11,
"peak_cpu_memory_MB": 0,
"peak_gpu_0_memory_MB": 1,
"peak_gpu_1_memory_MB": 3489,
"peak_gpu_2_memory_MB": 16884,
"peak_gpu_3_memory_MB": 16857,
"peak_gpu_4_memory_MB": 16886,
"peak_gpu_5_memory_MB": 16816,
"peak_gpu_6_memory_MB": 20163,
"peak_gpu_7_memory_MB": 19975,
"training_duration": "6:05:48.267567",
"training_start_epoch": 0,
"training_epochs": 20,
"epoch": 20,
"training_action_exact_match": 0,
"training__action_inter_exact_match": 0,
"training__action_turn_1_exact_match": 0,
"training__action_turn_2_exact_match": 0,
"training__action_turn_3_exact_match": 0,
"training__action_turn_4_exact_match": 0,
"training_sql_exact_match": 0,
"training__sql_inter_exact_match": 0,
"training__sql_turn_1_exact_match": 0,
"training__sql_turn_2_exact_match": 0,
"training__sql_turn_3_exact_match": 0,
"training__sql_turn_4_exact_match": 0,
"training__copy": 0,
"training_info": 0,
"training_loss": 0.07746467799366073,
"training_cpu_memory_MB": 0.0,
"training_gpu_0_memory_MB": 1,
"training_gpu_1_memory_MB": 3489,
"training_gpu_2_memory_MB": 16884,
"training_gpu_3_memory_MB": 16857,
"training_gpu_4_memory_MB": 16886,
"training_gpu_5_memory_MB": 16816,
"training_gpu_6_memory_MB": 20163,
"training_gpu_7_memory_MB": 19975,
"validation_action_exact_match": 0.407149950347567,
"validation__action_inter_exact_match": 0.12286689419795221,
"validation__action_turn_1_exact_match": 0.5085324232081911,
"validation__action_turn_2_exact_match": 0.3894736842105263,
"validation__action_turn_3_exact_match": 0.35655737704918034,
"validation__action_turn_4_exact_match": 0.34054054054054056,
"validation_sql_exact_match": 0.41211519364448856,
"validation__sql_inter_exact_match": 0.13993174061433447,
"validation__sql_turn_1_exact_match": 0.5324232081911263,
"validation__sql_turn_2_exact_match": 0.37894736842105264,
"validation__sql_turn_3_exact_match": 0.3770491803278688,
"validation__sql_turn_4_exact_match": 0.31891891891891894,
"validation__copy": 0,
"validation_info": 0,
"validation_loss": 0.16448146104812622,
"best_validation_action_exact_match": 0.42204568023833167,
"best_validation__action_inter_exact_match": 0.13993174061433447,
"best_validation__action_turn_1_exact_match": 0.515358361774744,
"best_validation__action_turn_2_exact_match": 0.39649122807017545,
"best_validation__action_turn_3_exact_match": 0.38524590163934425,
"best_validation__action_turn_4_exact_match": 0.3621621621621622,
"best_validation_sql_exact_match": 0.42105263157894735,
"best_validation__sql_inter_exact_match": 0.15358361774744028,
"best_validation__sql_turn_1_exact_match": 0.5290102389078498,
"best_validation__sql_turn_2_exact_match": 0.3824561403508772,
"best_validation__sql_turn_3_exact_match": 0.3975409836065574,
"best_validation__sql_turn_4_exact_match": 0.34054054054054056,
"best_validation__copy": 0,
"best_validation_info": 0,
"best_validation_loss": 0.1453363001346588
}
Pretrained Weights of SParC Concat Model
sparc.concat Initial SECURITY.md commit
Pretrained Weights of SParC BERT-based Concat Model
sparc.bert.concat Initial SECURITY.md commit
Pretrained Weights of CoSQL Concat Model
cosql.concat Initial SECURITY.md commit
Pretrained Weights of CoSQL BERT-based Concat Model
cosql.bert.concat Initial SECURITY.md commit