Pretrained Weights of CoSQL BERT-based Turn Model
SivilTaram released this on 23 Apr at 14:27 · 155 commits to master since this release
{
"best_epoch": 23,
"peak_cpu_memory_MB": 0,
"peak_gpu_0_memory_MB": 1,
"peak_gpu_1_memory_MB": 3489,
"peak_gpu_2_memory_MB": 16884,
"peak_gpu_3_memory_MB": 16857,
"peak_gpu_4_memory_MB": 16886,
"peak_gpu_5_memory_MB": 16816,
"peak_gpu_6_memory_MB": 20163,
"peak_gpu_7_memory_MB": 19975,
"training_duration": "8:04:29.261273",
"training_start_epoch": 0,
"training_epochs": 32,
"epoch": 32,
"training_action_exact_match": 0,
"training__action_inter_exact_match": 0,
"training__action_turn_1_exact_match": 0,
"training__action_turn_2_exact_match": 0,
"training__action_turn_3_exact_match": 0,
"training__action_turn_4_exact_match": 0,
"training_sql_exact_match": 0,
"training__sql_inter_exact_match": 0,
"training__sql_turn_1_exact_match": 0,
"training__sql_turn_2_exact_match": 0,
"training__sql_turn_3_exact_match": 0,
"training__sql_turn_4_exact_match": 0,
"training_loss": 0.05288350063624136,
"training_cpu_memory_MB": 0.0,
"training_gpu_0_memory_MB": 1,
"training_gpu_1_memory_MB": 1751,
"training_gpu_2_memory_MB": 16884,
"training_gpu_3_memory_MB": 16857,
"training_gpu_4_memory_MB": 16886,
"training_gpu_5_memory_MB": 16816,
"training_gpu_6_memory_MB": 20163,
"training_gpu_7_memory_MB": 2,
"validation_action_exact_match": 0.3843098311817279,
"validation__action_inter_exact_match": 0.12286689419795221,
"validation__action_turn_1_exact_match": 0.48464163822525597,
"validation__action_turn_2_exact_match": 0.35789473684210527,
"validation__action_turn_3_exact_match": 0.3483606557377049,
"validation__action_turn_4_exact_match": 0.31351351351351353,
"validation_sql_exact_match": 0.38828202581926513,
"validation__sql_inter_exact_match": 0.1296928327645051,
"validation__sql_turn_1_exact_match": 0.49829351535836175,
"validation__sql_turn_2_exact_match": 0.3473684210526316,
"validation__sql_turn_3_exact_match": 0.36065573770491804,
"validation__sql_turn_4_exact_match": 0.31351351351351353,
"validation_loss": 0.24153371155261993,
"best_validation_action_exact_match": 0.38927507447864945,
"best_validation__action_inter_exact_match": 0.13651877133105803,
"best_validation__action_turn_1_exact_match": 0.47440273037542663,
"best_validation__action_turn_2_exact_match": 0.38596491228070173,
"best_validation__action_turn_3_exact_match": 0.3442622950819672,
"best_validation__action_turn_4_exact_match": 0.31891891891891894,
"best_validation_sql_exact_match": 0.39225422045680236,
"best_validation__sql_inter_exact_match": 0.14334470989761092,
"best_validation__sql_turn_1_exact_match": 0.4948805460750853,
"best_validation__sql_turn_2_exact_match": 0.3684210526315789,
"best_validation__sql_turn_3_exact_match": 0.36475409836065575,
"best_validation__sql_turn_4_exact_match": 0.3027027027027027,
"best_validation_loss": 0.20682337880134583
}