Skip to content

Releases: microsoft/ContextualSP

LogiGAN: model and data

02 Nov 03:28
Compare
Choose a tag to compare

Training data and LogiGAN pretrained model.
The warmup pre-training data is gen_train_A.json, and the continual adversarial pre-training data is gen_train_B.json (the version of gen_train_B.json with Elasticsearch-retrieved pseudo samples is stored in train_data_with_es/gen_train_src_es.jsonl).

lemon_data

24 Oct 03:03
361503f
Compare
Choose a tag to compare

LEMON dataset and pre-training corpus.

Pretrained Weights of Multi BERT-based RUN

27 Oct 06:57
1c2dda0
Compare
Choose a tag to compare
{
    "ROUGE": 0.8954699040374693,
    "_ROUGE1": 0.9248370079585566,
    "_ROUGE2": 0.8548729804396925,
    "EM": 0.4933385579937304,
    "_P1": 0.7443478260869565,
    "_R1": 0.6512335615693946,
    "F1": 0.694684366123703,
    "_P2": 0.6040515653775322,
    "_R2": 0.5369713506139154,
    "F2": 0.5685396504405605,
    "_P3": 0.515867089789061,
    "_R3": 0.4619306310071041,
    "F3": 0.48741126151946734,
    "_BLEU1": 0.9203424772022362,
    "_BLEU2": 0.8919446800461631,
    "_BLEU3": 0.8644065076063657,
    "BLEU4": 0.836555297206264,
    "loss": 0.012869063752786444
}

Pretrained Weights of Multi RUN

27 Oct 06:37
1c2dda0
Compare
Choose a tag to compare
{
    "ROUGE": 0.8761914250271031,
    "_ROUGE1": 0.9096109449987978,
    "_ROUGE2": 0.8299625766685176,
    "EM": 0.43260188087774293,
    "_P1": 0.663828689370485,
    "_R1": 0.5592870340180415,
    "F1": 0.6070901905267504,
    "_P2": 0.5118311660626732,
    "_R2": 0.43674397453387903,
    "F2": 0.4713156990724837,
    "_P3": 0.42003325833903943,
    "_R3": 0.3588800668616799,
    "F3": 0.38705606634216694,
    "_BLEU1": 0.9049646708813686,
    "_BLEU2": 0.8726836197111325,
    "_BLEU3": 0.8417857314177102,
    "BLEU4": 0.810576724115273,
    "loss": 0.01269258979597015
}

Pretrained Weights of Rewrite BERT-based RUN

27 Oct 01:46
Compare
Choose a tag to compare
{
    "ROUGE": 0.9394040084189113,
    "_ROUGE1": 0.961865057419486,
    "_ROUGE2": 0.9113051224617216,
    "EM": 0.688,
    "_P1": 0.9451903332806824,
    "_R1": 0.8668694770389685,
    "F1": 0.9043373129817137,
    "_P2": 0.8648273949812838,
    "_R2": 0.7989241803278688,
    "F2": 0.8305705345849144,
    "_P3": 0.8075098814229249,
    "_R3": 0.7449860216360763,
    "F3": 0.774988935954985,
    "_BLEU1": 0.9405510823944796,
    "_BLEU2": 0.9172718486250105,
    "_BLEU3": 0.8932687251641028,
    "BLEU4": 0.8691863201601382,
    "loss": 0.2084200546145439
}

Pretrained Weights of Rewrite RUN

27 Oct 01:47
Compare
Choose a tag to compare
{
    "ROUGE": 0.8927719935645371,
    "_ROUGE1": 0.9235141523874184,
    "_ROUGE2": 0.8481181915297369,
    "EM": 0.536,
    "_P1": 0.8750417083750417,
    "_R1": 0.7598145733738955,
    "F1": 0.8133674497945259,
    "_P2": 0.7759128386336867,
    "_R2": 0.6749487704918032,
    "F2": 0.7219178082191782,
    "_P3": 0.7060550971892043,
    "_R3": 0.6137109517442567,
    "F3": 0.6566523605150214,
    "_BLEU1": 0.8953007499145113,
    "_BLEU2": 0.8627271154439679,
    "_BLEU3": 0.8298150265279266,
    "BLEU4": 0.7961327186223426,
    "loss": 0.07524961760888497
}

Pretrained Weights of CANARD RUN

27 Oct 02:28
Compare
Choose a tag to compare
{
    "ROUGE": 0.7672702010110017,
    "_ROUGE1": 0.8060129493808116,
    "_ROUGE2": 0.6272019845050271,
    "EM": 0.1825525040387722,
    "_P1": 0.6173277359583093,
    "_R1": 0.34435562015503873,
    "F1": 0.44210035247771096,
    "_P2": 0.39885553659271156,
    "_R2": 0.24790964682391115,
    "F2": 0.3057682687497595,
    "_P3": 0.31307374374592123,
    "_R3": 0.20793481087641227,
    "F3": 0.24989581886373105,
    "_BLEU1": 0.7020165933536937,
    "_BLEU2": 0.6217319698491652,
    "_BLEU3": 0.5573085608208992,
    "BLEU4": 0.4977857601746373,
    "loss": 0.01892541069261615
}

Pretrained Weights of SParC Turn Model

21 Apr 07:21
Compare
Choose a tag to compare
{
  "best_epoch": 48,
  "peak_cpu_memory_MB": 0,
  "peak_gpu_0_memory_MB": 1,
  "peak_gpu_1_memory_MB": 3489,
  "peak_gpu_2_memory_MB": 16884,
  "peak_gpu_3_memory_MB": 16857,
  "peak_gpu_4_memory_MB": 16886,
  "peak_gpu_5_memory_MB": 16816,
  "peak_gpu_6_memory_MB": 20163,
  "peak_gpu_7_memory_MB": 19975,
  "training_duration": "8:57:20.749721",
  "training_start_epoch": 0,
  "training_epochs": 57,
  "epoch": 57,
  "training_action_exact_match": 0,
  "training__action_inter_exact_match": 0,
  "training__action_turn_1_exact_match": 0,
  "training__action_turn_2_exact_match": 0,
  "training__action_turn_3_exact_match": 0,
  "training__action_turn_4_exact_match": 0,
  "training_sql_exact_match": 0,
  "training__sql_inter_exact_match": 0,
  "training__sql_turn_1_exact_match": 0,
  "training__sql_turn_2_exact_match": 0,
  "training__sql_turn_3_exact_match": 0,
  "training__sql_turn_4_exact_match": 0,
  "training_loss": 0.03923457075834353,
  "training_cpu_memory_MB": 0.0,
  "training_gpu_0_memory_MB": 1,
  "training_gpu_1_memory_MB": 1751,
  "training_gpu_2_memory_MB": 16884,
  "training_gpu_3_memory_MB": 16857,
  "training_gpu_4_memory_MB": 16886,
  "training_gpu_5_memory_MB": 16816,
  "training_gpu_6_memory_MB": 20163,
  "training_gpu_7_memory_MB": 2,
  "validation_action_exact_match": 0.4056525353283458,
  "validation__action_inter_exact_match": 0.1966824644549763,
  "validation__action_turn_1_exact_match": 0.5521327014218009,
  "validation__action_turn_2_exact_match": 0.3767772511848341,
  "validation__action_turn_3_exact_match": 0.29259259259259257,
  "validation__action_turn_4_exact_match": 0.19101123595505617,
  "validation_sql_exact_match": 0.42726517040731504,
  "validation__sql_inter_exact_match": 0.2132701421800948,
  "validation__sql_turn_1_exact_match": 0.5592417061611374,
  "validation__sql_turn_2_exact_match": 0.3933649289099526,
  "validation__sql_turn_3_exact_match": 0.3296296296296296,
  "validation__sql_turn_4_exact_match": 0.25842696629213485,
  "validation_loss": 0.1820486258486621,
  "best_validation_action_exact_match": 0.4222776392352452,
  "best_validation__action_inter_exact_match": 0.2014218009478673,
  "best_validation__action_turn_1_exact_match": 0.5710900473933649,
  "best_validation__action_turn_2_exact_match": 0.3933649289099526,
  "best_validation__action_turn_3_exact_match": 0.3,
  "best_validation__action_turn_4_exact_match": 0.2247191011235955,
  "best_validation_sql_exact_match": 0.43557772236076475,
  "best_validation__sql_inter_exact_match": 0.2037914691943128,
  "best_validation__sql_turn_1_exact_match": 0.5687203791469194,
  "best_validation__sql_turn_2_exact_match": 0.3981042654028436,
  "best_validation__sql_turn_3_exact_match": 0.3296296296296296,
  "best_validation__sql_turn_4_exact_match": 0.30337078651685395,
  "best_validation_loss": 0.17382763872011436
}

Pretrained Weights of SParC Action Copy Model

21 Apr 07:30
Compare
Choose a tag to compare
{
  "best_epoch": 22,
  "peak_cpu_memory_MB": 0,
  "peak_gpu_0_memory_MB": 2796,
  "peak_gpu_1_memory_MB": 16881,
  "peak_gpu_2_memory_MB": 1479,
  "peak_gpu_3_memory_MB": 16586,
  "peak_gpu_4_memory_MB": 496,
  "peak_gpu_5_memory_MB": 1968,
  "peak_gpu_6_memory_MB": 496,
  "peak_gpu_7_memory_MB": 507,
  "training_duration": "5:31:39.494340",
  "training_start_epoch": 0,
  "training_epochs": 31,
  "epoch": 31,
  "training_action_exact_match": 0,
  "training__action_inter_exact_match": 0,
  "training__action_turn_1_exact_match": 0,
  "training__action_turn_2_exact_match": 0,
  "training__action_turn_3_exact_match": 0,
  "training__action_turn_4_exact_match": 0,
  "training_sql_exact_match": 0,
  "training__sql_inter_exact_match": 0,
  "training__sql_turn_1_exact_match": 0,
  "training__sql_turn_2_exact_match": 0,
  "training__sql_turn_3_exact_match": 0,
  "training__sql_turn_4_exact_match": 0,
  "training__copy": 0,
  "training_info": 0,
  "training_loss": 0.06896944765227608,
  "training_cpu_memory_MB": 0.0,
  "training_gpu_0_memory_MB": 2796,
  "training_gpu_1_memory_MB": 16879,
  "training_gpu_2_memory_MB": 1479,
  "training_gpu_3_memory_MB": 16586,
  "training_gpu_4_memory_MB": 496,
  "training_gpu_5_memory_MB": 1968,
  "training_gpu_6_memory_MB": 496,
  "training_gpu_7_memory_MB": 507,
  "validation_action_exact_match": 0.37323358270989193,
  "validation__action_inter_exact_match": 0.17535545023696683,
  "validation__action_turn_1_exact_match": 0.5165876777251185,
  "validation__action_turn_2_exact_match": 0.33886255924170616,
  "validation__action_turn_3_exact_match": 0.2851851851851852,
  "validation__action_turn_4_exact_match": 0.12359550561797752,
  "validation_sql_exact_match": 0.3873649210307564,
  "validation__sql_inter_exact_match": 0.1895734597156398,
  "validation__sql_turn_1_exact_match": 0.518957345971564,
  "validation__sql_turn_2_exact_match": 0.35545023696682465,
  "validation__sql_turn_3_exact_match": 0.3,
  "validation__sql_turn_4_exact_match": 0.1797752808988764,
  "validation__copy": 0,
  "validation_info": 0,
  "validation_loss": 0.13728585836002538,
  "best_validation_action_exact_match": 0.372402327514547,
  "best_validation__action_inter_exact_match": 0.18009478672985782,
  "best_validation__action_turn_1_exact_match": 0.5260663507109005,
  "best_validation__action_turn_2_exact_match": 0.33886255924170616,
  "best_validation__action_turn_3_exact_match": 0.25925925925925924,
  "best_validation__action_turn_4_exact_match": 0.14606741573033707,
  "best_validation_sql_exact_match": 0.38902743142144636,
  "best_validation__sql_inter_exact_match": 0.1966824644549763,
  "best_validation__sql_turn_1_exact_match": 0.5355450236966824,
  "best_validation__sql_turn_2_exact_match": 0.35545023696682465,
  "best_validation__sql_turn_3_exact_match": 0.2740740740740741,
  "best_validation__sql_turn_4_exact_match": 0.20224719101123595,
  "best_validation__copy": 0,
  "best_validation_info": 0,
  "best_validation_loss": 0.13164386158200506
}

Pretrained Weights of SParC BERT-based Turn Model

23 Apr 13:55
Compare
Choose a tag to compare
{
  "best_epoch": 45,
  "peak_cpu_memory_MB": 0,
  "peak_gpu_0_memory_MB": 1,
  "peak_gpu_1_memory_MB": 4185,
  "peak_gpu_2_memory_MB": 16884,
  "peak_gpu_3_memory_MB": 16857,
  "peak_gpu_4_memory_MB": 16886,
  "peak_gpu_5_memory_MB": 16816,
  "peak_gpu_6_memory_MB": 22499,
  "peak_gpu_7_memory_MB": 20477,
  "training_duration": "15:38:25.817253",
  "training_start_epoch": 0,
  "training_epochs": 54,
  "epoch": 54,
  "training_action_exact_match": 0,
  "training__action_inter_exact_match": 0,
  "training__action_turn_1_exact_match": 0,
  "training__action_turn_2_exact_match": 0,
  "training__action_turn_3_exact_match": 0,
  "training__action_turn_4_exact_match": 0,
  "training_sql_exact_match": 0,
  "training__sql_inter_exact_match": 0,
  "training__sql_turn_1_exact_match": 0,
  "training__sql_turn_2_exact_match": 0,
  "training__sql_turn_3_exact_match": 0,
  "training__sql_turn_4_exact_match": 0,
  "training_loss": 0.03840326214035231,
  "training_cpu_memory_MB": 0.0,
  "training_gpu_0_memory_MB": 1,
  "training_gpu_1_memory_MB": 3238,
  "training_gpu_2_memory_MB": 16884,
  "training_gpu_3_memory_MB": 16857,
  "training_gpu_4_memory_MB": 16886,
  "training_gpu_5_memory_MB": 2,
  "training_gpu_6_memory_MB": 22499,
  "training_gpu_7_memory_MB": 20477,
  "validation_action_exact_match": 0.4405652535328346,
  "validation__action_inter_exact_match": 0.23459715639810427,
  "validation__action_turn_1_exact_match": 0.6018957345971564,
  "validation__action_turn_2_exact_match": 0.4218009478672986,
  "validation__action_turn_3_exact_match": 0.2962962962962963,
  "validation__action_turn_4_exact_match": 0.20224719101123595,
  "validation_sql_exact_match": 0.46467165419783873,
  "validation__sql_inter_exact_match": 0.26303317535545023,
  "validation__sql_turn_1_exact_match": 0.6184834123222749,
  "validation__sql_turn_2_exact_match": 0.45260663507109006,
  "validation__sql_turn_3_exact_match": 0.32592592592592595,
  "validation__sql_turn_4_exact_match": 0.21348314606741572,
  "validation_loss": 0.20552104420625325,
  "best_validation_action_exact_match": 0.4513715710723192,
  "best_validation__action_inter_exact_match": 0.23933649289099526,
  "best_validation__action_turn_1_exact_match": 0.6137440758293838,
  "best_validation__action_turn_2_exact_match": 0.43364928909952605,
  "best_validation__action_turn_3_exact_match": 0.28888888888888886,
  "best_validation__action_turn_4_exact_match": 0.25842696629213485,
  "best_validation_sql_exact_match": 0.4696591853699086,
  "best_validation__sql_inter_exact_match": 0.26303317535545023,
  "best_validation__sql_turn_1_exact_match": 0.6255924170616114,
  "best_validation__sql_turn_2_exact_match": 0.45734597156398105,
  "best_validation__sql_turn_3_exact_match": 0.3148148148148148,
  "best_validation__sql_turn_4_exact_match": 0.25842696629213485,
  "best_validation_loss": 0.18703062564368952
}