From 7678cac37187577c97606fe599970afee11d4448 Mon Sep 17 00:00:00 2001 From: dinhanhx Date: Thu, 19 Aug 2021 18:09:35 +0700 Subject: [PATCH] Add config files --- .../train-hm-base-hextuple-hpc_0_imgcap.json | 43 +++++++++++++++++++ ...hm-base-hextuple-hpc_0_imgcap_HimariO.json | 43 +++++++++++++++++++ .../train-hm-base-quadruple-hpc_0_imgcap.json | 43 +++++++++++++++++++ ...m-base-quadruple-hpc_0_imgcap_HimariO.json | 43 +++++++++++++++++++ .../train-hm-base-triple-hpc_0_imgcap.json | 43 +++++++++++++++++++ .../train-hm-base-triple-hpc_0_imgcap_2.json | 43 +++++++++++++++++++ .../train-hm-large-triple-hpc_0_imgcap.json | 43 +++++++++++++++++++ .../train-hm-large-triple-hpc_0_imgcap_2.json | 43 +++++++++++++++++++ ...n-hm-base-triple-hpc_0_imgcap_HimariO.json | 43 +++++++++++++++++++ ...e-hpc_0_imgcap_bert-base-cased_insert.json | 43 +++++++++++++++++++ ...c_0_imgcap_bert-base-cased_substitute.json | 43 +++++++++++++++++++ ...0_imgcap_bert-base-uncased_substitute.json | 43 +++++++++++++++++++ ...imgcap_distilbert-base-uncased_insert.json | 43 +++++++++++++++++++ ...ap_distilbert-base-uncased_substitute.json | 43 +++++++++++++++++++ ...pc_0_imgcap_distilroberta-base_insert.json | 43 +++++++++++++++++++ ..._imgcap_distilroberta-base_substitute.json | 43 +++++++++++++++++++ ...-hpc_0_imgcap_xlnet-base-cased_insert.json | 43 +++++++++++++++++++ ..._0_imgcap_xlnet-base-cased_substitute.json | 43 +++++++++++++++++++ .../train-hm-large-pa-1gpu-hpc_0_3420.json | 43 +++++++++++++++++++ .../train-hm-large-pa-1gpu-hpc_0_3420_2.json | 43 +++++++++++++++++++ 20 files changed, 860 insertions(+) create mode 100644 UNITER/config/dax/hextuple_attn/train-hm-base-hextuple-hpc_0_imgcap.json create mode 100644 UNITER/config/dax/hextuple_attn/train-hm-base-hextuple-hpc_0_imgcap_HimariO.json create mode 100644 UNITER/config/dax/quadruple_attn/train-hm-base-quadruple-hpc_0_imgcap.json create mode 100644 UNITER/config/dax/quadruple_attn/train-hm-base-quadruple-hpc_0_imgcap_HimariO.json create mode 100644 UNITER/config/dax/triple_cyclic/train-hm-base-triple-hpc_0_imgcap.json create mode 100644 UNITER/config/dax/triple_cyclic/train-hm-base-triple-hpc_0_imgcap_2.json create mode 100644 UNITER/config/dax/triple_cyclic/train-hm-large-triple-hpc_0_imgcap.json create mode 100644 UNITER/config/dax/triple_cyclic/train-hm-large-triple-hpc_0_imgcap_2.json create mode 100644 UNITER/config/dax/triple_cyclic/with_imgcap_HimariO/train-hm-base-triple-hpc_0_imgcap_HimariO.json create mode 100644 UNITER/config/dax/triple_cyclic/with_imgcap_nlpqug/train-hm-base-triple-hpc_0_imgcap_bert-base-cased_insert.json create mode 100644 UNITER/config/dax/triple_cyclic/with_imgcap_nlpqug/train-hm-base-triple-hpc_0_imgcap_bert-base-cased_substitute.json create mode 100644 UNITER/config/dax/triple_cyclic/with_imgcap_nlpqug/train-hm-base-triple-hpc_0_imgcap_bert-base-uncased_substitute.json create mode 100644 UNITER/config/dax/triple_cyclic/with_imgcap_nlpqug/train-hm-base-triple-hpc_0_imgcap_distilbert-base-uncased_insert.json create mode 100644 UNITER/config/dax/triple_cyclic/with_imgcap_nlpqug/train-hm-base-triple-hpc_0_imgcap_distilbert-base-uncased_substitute.json create mode 100644 UNITER/config/dax/triple_cyclic/with_imgcap_nlpqug/train-hm-base-triple-hpc_0_imgcap_distilroberta-base_insert.json create mode 100644 UNITER/config/dax/triple_cyclic/with_imgcap_nlpqug/train-hm-base-triple-hpc_0_imgcap_distilroberta-base_substitute.json create mode 100644 UNITER/config/dax/triple_cyclic/with_imgcap_nlpqug/train-hm-base-triple-hpc_0_imgcap_xlnet-base-cased_insert.json create mode 100644 UNITER/config/dax/triple_cyclic/with_imgcap_nlpqug/train-hm-base-triple-hpc_0_imgcap_xlnet-base-cased_substitute.json create mode 100644 UNITER/config/dax/with_imgcap/train-hm-large-pa-1gpu-hpc_0_3420.json create mode 100644 UNITER/config/dax/with_imgcap/train-hm-large-pa-1gpu-hpc_0_3420_2.json diff --git a/UNITER/config/dax/hextuple_attn/train-hm-base-hextuple-hpc_0_imgcap.json b/UNITER/config/dax/hextuple_attn/train-hm-base-hextuple-hpc_0_imgcap.json new file mode 100644 index 0000000..8eab394 --- /dev/null +++ b/UNITER/config/dax/hextuple_attn/train-hm-base-hextuple-hpc_0_imgcap.json @@ -0,0 +1,43 @@ +{ + "root_path": "./", + "dataset_path": "../data", + "precomputed_boxes": { + "train": "data_train_d2_10-100_vg.tsv", + "dev": "data_dev_seen_unseen_d2_10-100_vg.tsv", + "test": "data_test_seen_d2_10-100_vg.tsv" + }, + "captions_file": "imgcap/hm_caption.csv", + "paraphrased_file":"textaug/data_test_paraphrased_nlpaug_bert-base-uncased.jsonl", + "train_image_set": "train+dev", + "val_image_set": "dev", + "test_image_set": "test", + "checkpoint": "../UNITER/storage/pretrained/uniter-base.pt", + "model_config": "./config/uniter-base.json", + "model": "hextuple", + "use_img_type": false, + "output_dir": "../model_asset/output_hextuple_dev_seen_unseen_0_imgcap/hm/base", + "max_txt_len": 100, + "conf_th": 0.2, + "max_bb": 100, + "min_bb": 10, + "num_bb": 36, + "train_batch_size": 3328, + "val_batch_size": 2496, + "gradient_accumulation_steps": 2, + "learning_rate": 2e-05, + "valid_steps": 285, + "num_train_steps": 3420, + "optim": "adamw", + "betas": [ + 0.9, + 0.98 + ], + "dropout": 0.2, + "weight_decay": 0.01, + "grad_norm": 2.0, + "warmup_steps": 285, + "seed": 0, + "fp16": true, + "n_workers": 4, + "pin_mem": true +} diff --git a/UNITER/config/dax/hextuple_attn/train-hm-base-hextuple-hpc_0_imgcap_HimariO.json b/UNITER/config/dax/hextuple_attn/train-hm-base-hextuple-hpc_0_imgcap_HimariO.json new file mode 100644 index 0000000..00cf525 --- /dev/null +++ b/UNITER/config/dax/hextuple_attn/train-hm-base-hextuple-hpc_0_imgcap_HimariO.json @@ -0,0 +1,43 @@ +{ + "root_path": "./", + "dataset_path": "../data", + "precomputed_boxes": { + "train": "data_train_d2_10-100_vg.tsv", + "dev": "data_dev_seen_unseen_d2_10-100_vg.tsv", + "test": "data_test_seen_d2_10-100_vg.tsv" + }, + "captions_file": "imgcap/hm_caption.csv", + "paraphrased_file":"HimariO_annotations/data_test.jsonl", + "train_image_set": "train+dev", + "val_image_set": "dev", + "test_image_set": "test", + "checkpoint": "../UNITER/storage/pretrained/uniter-base.pt", + "model_config": "./config/uniter-base.json", + "model": "hextuple", + "use_img_type": false, + "output_dir": "../model_asset/output_hextuple_dev_seen_unseen_0_imgcap_HimariO/hm/base", + "max_txt_len": 100, + "conf_th": 0.2, + "max_bb": 100, + "min_bb": 10, + "num_bb": 36, + "train_batch_size": 3328, + "val_batch_size": 2496, + "gradient_accumulation_steps": 2, + "learning_rate": 2e-05, + "valid_steps": 285, + "num_train_steps": 3420, + "optim": "adamw", + "betas": [ + 0.9, + 0.98 + ], + "dropout": 0.2, + "weight_decay": 0.01, + "grad_norm": 2.0, + "warmup_steps": 285, + "seed": 0, + "fp16": true, + "n_workers": 4, + "pin_mem": true +} diff --git a/UNITER/config/dax/quadruple_attn/train-hm-base-quadruple-hpc_0_imgcap.json b/UNITER/config/dax/quadruple_attn/train-hm-base-quadruple-hpc_0_imgcap.json new file mode 100644 index 0000000..b2ee074 --- /dev/null +++ b/UNITER/config/dax/quadruple_attn/train-hm-base-quadruple-hpc_0_imgcap.json @@ -0,0 +1,43 @@ +{ + "root_path": "./", + "dataset_path": "../data", + "precomputed_boxes": { + "train": "data_train_d2_10-100_vg.tsv", + "dev": "data_dev_seen_unseen_d2_10-100_vg.tsv", + "test": "data_test_seen_d2_10-100_vg.tsv" + }, + "captions_file": "imgcap/hm_caption.csv", + "paraphrased_file":"textaug/data_test_paraphrased_nlpaug_bert-base-uncased.jsonl", + "train_image_set": "train+dev", + "val_image_set": "dev", + "test_image_set": "test", + "checkpoint": "../UNITER/storage/pretrained/uniter-base.pt", + "model_config": "./config/uniter-base.json", + "model": "quadruple", + "use_img_type": false, + "output_dir": "../model_asset/output_quadruple_dev_seen_unseen_0_imgcap/hm/base", + "max_txt_len": 100, + "conf_th": 0.2, + "max_bb": 100, + "min_bb": 10, + "num_bb": 36, + "train_batch_size": 3328, + "val_batch_size": 2496, + "gradient_accumulation_steps": 2, + "learning_rate": 2e-05, + "valid_steps": 285, + "num_train_steps": 3420, + "optim": "adamw", + "betas": [ + 0.9, + 0.98 + ], + "dropout": 0.2, + "weight_decay": 0.01, + "grad_norm": 2.0, + "warmup_steps": 285, + "seed": 0, + "fp16": true, + "n_workers": 4, + "pin_mem": true +} diff --git a/UNITER/config/dax/quadruple_attn/train-hm-base-quadruple-hpc_0_imgcap_HimariO.json b/UNITER/config/dax/quadruple_attn/train-hm-base-quadruple-hpc_0_imgcap_HimariO.json new file mode 100644 index 0000000..b24cd8d --- /dev/null +++ b/UNITER/config/dax/quadruple_attn/train-hm-base-quadruple-hpc_0_imgcap_HimariO.json @@ -0,0 +1,43 @@ +{ + "root_path": "./", + "dataset_path": "../data", + "precomputed_boxes": { + "train": "data_train_d2_10-100_vg.tsv", + "dev": "data_dev_seen_unseen_d2_10-100_vg.tsv", + "test": "data_test_seen_d2_10-100_vg.tsv" + }, + "captions_file": "imgcap/hm_caption.csv", + "paraphrased_file":"HimariO_annotations/data_test.jsonl", + "train_image_set": "train+dev", + "val_image_set": "dev", + "test_image_set": "test", + "checkpoint": "../UNITER/storage/pretrained/uniter-base.pt", + "model_config": "./config/uniter-base.json", + "model": "quadruple", + "use_img_type": false, + "output_dir": "../model_asset/output_quadruple_dev_seen_unseen_0_imgcap_HimariO/hm/base", + "max_txt_len": 100, + "conf_th": 0.2, + "max_bb": 100, + "min_bb": 10, + "num_bb": 36, + "train_batch_size": 3328, + "val_batch_size": 2496, + "gradient_accumulation_steps": 2, + "learning_rate": 2e-05, + "valid_steps": 285, + "num_train_steps": 3420, + "optim": "adamw", + "betas": [ + 0.9, + 0.98 + ], + "dropout": 0.2, + "weight_decay": 0.01, + "grad_norm": 2.0, + "warmup_steps": 285, + "seed": 0, + "fp16": true, + "n_workers": 4, + "pin_mem": true +} diff --git a/UNITER/config/dax/triple_cyclic/train-hm-base-triple-hpc_0_imgcap.json b/UNITER/config/dax/triple_cyclic/train-hm-base-triple-hpc_0_imgcap.json new file mode 100644 index 0000000..1ca03f4 --- /dev/null +++ b/UNITER/config/dax/triple_cyclic/train-hm-base-triple-hpc_0_imgcap.json @@ -0,0 +1,43 @@ +{ + "root_path": "./", + "dataset_path": "../data", + "precomputed_boxes": { + "train": "data_train_d2_10-100_vg.tsv", + "dev": "data_dev_seen_unseen_d2_10-100_vg.tsv", + "test": "data_test_seen_d2_10-100_vg.tsv" + }, + "captions_file": "imgcap/hm_caption.csv", + "paraphrased_file":"textaug/data_test_paraphrased_nlpaug_bert-base-uncased.jsonl", + "train_image_set": "train+dev", + "val_image_set": "dev", + "test_image_set": "test", + "checkpoint": "../UNITER/storage/pretrained/uniter-base.pt", + "model_config": "./config/uniter-base.json", + "model": "triple", + "use_img_type": false, + "output_dir": "../model_asset/output_triple_dev_seen_unseen_0_imgcap/hm/base", + "max_txt_len": 100, + "conf_th": 0.2, + "max_bb": 100, + "min_bb": 10, + "num_bb": 36, + "train_batch_size": 3328, + "val_batch_size": 2496, + "gradient_accumulation_steps": 2, + "learning_rate": 2e-05, + "valid_steps": 285, + "num_train_steps": 3420, + "optim": "adamw", + "betas": [ + 0.9, + 0.98 + ], + "dropout": 0.2, + "weight_decay": 0.01, + "grad_norm": 2.0, + "warmup_steps": 285, + "seed": 0, + "fp16": true, + "n_workers": 4, + "pin_mem": true +} diff --git a/UNITER/config/dax/triple_cyclic/train-hm-base-triple-hpc_0_imgcap_2.json b/UNITER/config/dax/triple_cyclic/train-hm-base-triple-hpc_0_imgcap_2.json new file mode 100644 index 0000000..e4c6daf --- /dev/null +++ b/UNITER/config/dax/triple_cyclic/train-hm-base-triple-hpc_0_imgcap_2.json @@ -0,0 +1,43 @@ +{ + "root_path": "./", + "dataset_path": "../data", + "precomputed_boxes": { + "train": "data_train_d2_10-100_vg.tsv", + "dev": "data_dev_seen_unseen_d2_10-100_vg.tsv", + "test": "data_test_seen_d2_10-100_vg.tsv" + }, + "captions_file": "imgcap/hm_caption_2.csv", + "paraphrased_file":"textaug/data_test_paraphrased_nlpaug_bert-base-uncased.jsonl", + "train_image_set": "train+dev", + "val_image_set": "dev", + "test_image_set": "test", + "checkpoint": "../UNITER/storage/pretrained/uniter-base.pt", + "model_config": "./config/uniter-base.json", + "model": "triple", + "use_img_type": false, + "output_dir": "../model_asset/output_triple_dev_seen_unseen_0_imgcap_2/hm/base", + "max_txt_len": 100, + "conf_th": 0.2, + "max_bb": 100, + "min_bb": 10, + "num_bb": 36, + "train_batch_size": 2145, + "val_batch_size": 2496, + "gradient_accumulation_steps": 3, + "learning_rate": 2e-05, + "valid_steps": 285, + "num_train_steps": 3420, + "optim": "adamw", + "betas": [ + 0.9, + 0.98 + ], + "dropout": 0.2, + "weight_decay": 0.01, + "grad_norm": 2.0, + "warmup_steps": 285, + "seed": 0, + "fp16": true, + "n_workers": 4, + "pin_mem": true +} diff --git a/UNITER/config/dax/triple_cyclic/train-hm-large-triple-hpc_0_imgcap.json b/UNITER/config/dax/triple_cyclic/train-hm-large-triple-hpc_0_imgcap.json new file mode 100644 index 0000000..df15811 --- /dev/null +++ b/UNITER/config/dax/triple_cyclic/train-hm-large-triple-hpc_0_imgcap.json @@ -0,0 +1,43 @@ +{ + "root_path": "./", + "dataset_path": "../data", + "precomputed_boxes": { + "train": "data_train_d2_10-100_vg.tsv", + "dev": "data_dev_seen_unseen_d2_10-100_vg.tsv", + "test": "data_test_seen_d2_10-100_vg.tsv" + }, + "captions_file": "imgcap/hm_caption.csv", + "paraphrased_file":"textaug/data_test_paraphrased_nlpaug_bert-base-uncased.jsonl", + "train_image_set": "train+dev", + "val_image_set": "dev", + "test_image_set": "test", + "checkpoint": "../UNITER/storage/pretrained/uniter-large.pt", + "model_config": "./config/uniter-large.json", + "model": "triple_para", + "use_img_type": false, + "output_dir": "../model_asset/output_triple_dev_seen_unseen_0_imgcap/hm/large", + "max_txt_len": 100, + "conf_th": 0.2, + "max_bb": 100, + "min_bb": 10, + "num_bb": 36, + "train_batch_size": 2150, + "val_batch_size": 2496, + "gradient_accumulation_steps": 3, + "learning_rate": 2e-05, + "valid_steps": 285, + "num_train_steps": 3420, + "optim": "adamw", + "betas": [ + 0.9, + 0.98 + ], + "dropout": 0.2, + "weight_decay": 0.01, + "grad_norm": 2.0, + "warmup_steps": 285, + "seed": 0, + "fp16": true, + "n_workers": 4, + "pin_mem": false +} diff --git a/UNITER/config/dax/triple_cyclic/train-hm-large-triple-hpc_0_imgcap_2.json b/UNITER/config/dax/triple_cyclic/train-hm-large-triple-hpc_0_imgcap_2.json new file mode 100644 index 0000000..fa97dc5 --- /dev/null +++ b/UNITER/config/dax/triple_cyclic/train-hm-large-triple-hpc_0_imgcap_2.json @@ -0,0 +1,43 @@ +{ + "root_path": "./", + "dataset_path": "../data", + "precomputed_boxes": { + "train": "data_train_d2_10-100_vg.tsv", + "dev": "data_dev_seen_unseen_d2_10-100_vg.tsv", + "test": "data_test_seen_d2_10-100_vg.tsv" + }, + "captions_file": "imgcap/hm_caption_2.csv", + "paraphrased_file":"textaug/data_test_paraphrased_nlpaug_bert-base-uncased.jsonl", + "train_image_set": "train+dev", + "val_image_set": "dev", + "test_image_set": "test", + "checkpoint": "../UNITER/storage/pretrained/uniter-large.pt", + "model_config": "./config/uniter-large.json", + "model": "triple", + "use_img_type": false, + "output_dir": "../model_asset/output_triple_dev_seen_unseen_0_imgcap_2/hm/large", + "max_txt_len": 100, + "conf_th": 0.2, + "max_bb": 100, + "min_bb": 10, + "num_bb": 36, + "train_batch_size": 2145, + "val_batch_size": 2496, + "gradient_accumulation_steps": 3, + "learning_rate": 2e-05, + "valid_steps": 285, + "num_train_steps": 3420, + "optim": "adamw", + "betas": [ + 0.9, + 0.98 + ], + "dropout": 0.2, + "weight_decay": 0.01, + "grad_norm": 2.0, + "warmup_steps": 285, + "seed": 0, + "fp16": true, + "n_workers": 4, + "pin_mem": true +} diff --git a/UNITER/config/dax/triple_cyclic/with_imgcap_HimariO/train-hm-base-triple-hpc_0_imgcap_HimariO.json b/UNITER/config/dax/triple_cyclic/with_imgcap_HimariO/train-hm-base-triple-hpc_0_imgcap_HimariO.json new file mode 100644 index 0000000..6d29274 --- /dev/null +++ b/UNITER/config/dax/triple_cyclic/with_imgcap_HimariO/train-hm-base-triple-hpc_0_imgcap_HimariO.json @@ -0,0 +1,43 @@ +{ + "root_path": "./", + "dataset_path": "../data", + "precomputed_boxes": { + "train": "data_train_d2_10-100_vg.tsv", + "dev": "data_dev_seen_unseen_d2_10-100_vg.tsv", + "test": "data_test_seen_d2_10-100_vg.tsv" + }, + "captions_file": "imgcap/hm_caption.csv", + "paraphrased_file":"HimariO_annotations/data_test.jsonl", + "train_image_set": "train+dev", + "val_image_set": "dev", + "test_image_set": "test", + "checkpoint": "../UNITER/storage/pretrained/uniter-base.pt", + "model_config": "./config/uniter-base.json", + "model": "triple", + "use_img_type": false, + "output_dir": "../model_asset/output_triple_dev_seen_unseen_0_imgcap_HimariO/hm/base", + "max_txt_len": 100, + "conf_th": 0.2, + "max_bb": 100, + "min_bb": 10, + "num_bb": 36, + "train_batch_size": 3328, + "val_batch_size": 2496, + "gradient_accumulation_steps": 2, + "learning_rate": 2e-05, + "valid_steps": 285, + "num_train_steps": 3420, + "optim": "adamw", + "betas": [ + 0.9, + 0.98 + ], + "dropout": 0.2, + "weight_decay": 0.01, + "grad_norm": 2.0, + "warmup_steps": 285, + "seed": 0, + "fp16": true, + "n_workers": 4, + "pin_mem": true +} diff --git a/UNITER/config/dax/triple_cyclic/with_imgcap_nlpqug/train-hm-base-triple-hpc_0_imgcap_bert-base-cased_insert.json b/UNITER/config/dax/triple_cyclic/with_imgcap_nlpqug/train-hm-base-triple-hpc_0_imgcap_bert-base-cased_insert.json new file mode 100644 index 0000000..33afc10 --- /dev/null +++ b/UNITER/config/dax/triple_cyclic/with_imgcap_nlpqug/train-hm-base-triple-hpc_0_imgcap_bert-base-cased_insert.json @@ -0,0 +1,43 @@ +{ + "root_path": "./", + "dataset_path": "../data", + "precomputed_boxes": { + "train": "data_train_d2_10-100_vg.tsv", + "dev": "data_dev_seen_unseen_d2_10-100_vg.tsv", + "test": "data_test_seen_d2_10-100_vg.tsv" + }, + "captions_file": "imgcap/hm_caption.csv", + "paraphrased_file":"textaug/data_test_paraphrased_nlpaug_bert-base-cased_insert.jsonl", + "train_image_set": "train+dev", + "val_image_set": "dev", + "test_image_set": "test", + "checkpoint": "../UNITER/storage/pretrained/uniter-base.pt", + "model_config": "./config/uniter-base.json", + "model": "triple", + "use_img_type": false, + "output_dir": "../model_asset/output_triple_dev_seen_unseen_0_imgcap_bert-base-cased_insert/hm/base", + "max_txt_len": 100, + "conf_th": 0.2, + "max_bb": 100, + "min_bb": 10, + "num_bb": 36, + "train_batch_size": 3328, + "val_batch_size": 2496, + "gradient_accumulation_steps": 2, + "learning_rate": 2e-05, + "valid_steps": 285, + "num_train_steps": 3420, + "optim": "adamw", + "betas": [ + 0.9, + 0.98 + ], + "dropout": 0.2, + "weight_decay": 0.01, + "grad_norm": 2.0, + "warmup_steps": 285, + "seed": 0, + "fp16": true, + "n_workers": 4, + "pin_mem": true +} diff --git a/UNITER/config/dax/triple_cyclic/with_imgcap_nlpqug/train-hm-base-triple-hpc_0_imgcap_bert-base-cased_substitute.json b/UNITER/config/dax/triple_cyclic/with_imgcap_nlpqug/train-hm-base-triple-hpc_0_imgcap_bert-base-cased_substitute.json new file mode 100644 index 0000000..ca8ff9c --- /dev/null +++ b/UNITER/config/dax/triple_cyclic/with_imgcap_nlpqug/train-hm-base-triple-hpc_0_imgcap_bert-base-cased_substitute.json @@ -0,0 +1,43 @@ +{ + "root_path": "./", + "dataset_path": "../data", + "precomputed_boxes": { + "train": "data_train_d2_10-100_vg.tsv", + "dev": "data_dev_seen_unseen_d2_10-100_vg.tsv", + "test": "data_test_seen_d2_10-100_vg.tsv" + }, + "captions_file": "imgcap/hm_caption.csv", + "paraphrased_file":"textaug/data_test_paraphrased_nlpaug_bert-base-cased_substitute.jsonl", + "train_image_set": "train+dev", + "val_image_set": "dev", + "test_image_set": "test", + "checkpoint": "../UNITER/storage/pretrained/uniter-base.pt", + "model_config": "./config/uniter-base.json", + "model": "triple", + "use_img_type": false, + "output_dir": "../model_asset/output_triple_dev_seen_unseen_0_imgcap_bert-base-cased_substitute/hm/base", + "max_txt_len": 100, + "conf_th": 0.2, + "max_bb": 100, + "min_bb": 10, + "num_bb": 36, + "train_batch_size": 3328, + "val_batch_size": 2496, + "gradient_accumulation_steps": 2, + "learning_rate": 2e-05, + "valid_steps": 285, + "num_train_steps": 3420, + "optim": "adamw", + "betas": [ + 0.9, + 0.98 + ], + "dropout": 0.2, + "weight_decay": 0.01, + "grad_norm": 2.0, + "warmup_steps": 285, + "seed": 0, + "fp16": true, + "n_workers": 4, + "pin_mem": true +} diff --git a/UNITER/config/dax/triple_cyclic/with_imgcap_nlpqug/train-hm-base-triple-hpc_0_imgcap_bert-base-uncased_substitute.json b/UNITER/config/dax/triple_cyclic/with_imgcap_nlpqug/train-hm-base-triple-hpc_0_imgcap_bert-base-uncased_substitute.json new file mode 100644 index 0000000..0434ec6 --- /dev/null +++ b/UNITER/config/dax/triple_cyclic/with_imgcap_nlpqug/train-hm-base-triple-hpc_0_imgcap_bert-base-uncased_substitute.json @@ -0,0 +1,43 @@ +{ + "root_path": "./", + "dataset_path": "../data", + "precomputed_boxes": { + "train": "data_train_d2_10-100_vg.tsv", + "dev": "data_dev_seen_unseen_d2_10-100_vg.tsv", + "test": "data_test_seen_d2_10-100_vg.tsv" + }, + "captions_file": "imgcap/hm_caption.csv", + "paraphrased_file":"textaug/data_test_paraphrased_nlpaug_bert-base-uncased_substitute.jsonl", + "train_image_set": "train+dev", + "val_image_set": "dev", + "test_image_set": "test", + "checkpoint": "../UNITER/storage/pretrained/uniter-base.pt", + "model_config": "./config/uniter-base.json", + "model": "triple", + "use_img_type": false, + "output_dir": "../model_asset/output_triple_dev_seen_unseen_0_imgcap_bert-base-uncased_substitute/hm/base", + "max_txt_len": 100, + "conf_th": 0.2, + "max_bb": 100, + "min_bb": 10, + "num_bb": 36, + "train_batch_size": 3328, + "val_batch_size": 2496, + "gradient_accumulation_steps": 2, + "learning_rate": 2e-05, + "valid_steps": 285, + "num_train_steps": 3420, + "optim": "adamw", + "betas": [ + 0.9, + 0.98 + ], + "dropout": 0.2, + "weight_decay": 0.01, + "grad_norm": 2.0, + "warmup_steps": 285, + "seed": 0, + "fp16": true, + "n_workers": 4, + "pin_mem": true +} diff --git a/UNITER/config/dax/triple_cyclic/with_imgcap_nlpqug/train-hm-base-triple-hpc_0_imgcap_distilbert-base-uncased_insert.json b/UNITER/config/dax/triple_cyclic/with_imgcap_nlpqug/train-hm-base-triple-hpc_0_imgcap_distilbert-base-uncased_insert.json new file mode 100644 index 0000000..1f2aae0 --- /dev/null +++ b/UNITER/config/dax/triple_cyclic/with_imgcap_nlpqug/train-hm-base-triple-hpc_0_imgcap_distilbert-base-uncased_insert.json @@ -0,0 +1,43 @@ +{ + "root_path": "./", + "dataset_path": "../data", + "precomputed_boxes": { + "train": "data_train_d2_10-100_vg.tsv", + "dev": "data_dev_seen_unseen_d2_10-100_vg.tsv", + "test": "data_test_seen_d2_10-100_vg.tsv" + }, + "captions_file": "imgcap/hm_caption.csv", + "paraphrased_file":"textaug/data_test_paraphrased_nlpaug_distilbert-base-uncased_insert.jsonl", + "train_image_set": "train+dev", + "val_image_set": "dev", + "test_image_set": "test", + "checkpoint": "../UNITER/storage/pretrained/uniter-base.pt", + "model_config": "./config/uniter-base.json", + "model": "triple", + "use_img_type": false, + "output_dir": "../model_asset/output_triple_dev_seen_unseen_0_imgcap_distilbert-base-uncased_insert/hm/base", + "max_txt_len": 100, + "conf_th": 0.2, + "max_bb": 100, + "min_bb": 10, + "num_bb": 36, + "train_batch_size": 3328, + "val_batch_size": 2496, + "gradient_accumulation_steps": 2, + "learning_rate": 2e-05, + "valid_steps": 285, + "num_train_steps": 3420, + "optim": "adamw", + "betas": [ + 0.9, + 0.98 + ], + "dropout": 0.2, + "weight_decay": 0.01, + "grad_norm": 2.0, + "warmup_steps": 285, + "seed": 0, + "fp16": true, + "n_workers": 4, + "pin_mem": true +} diff --git a/UNITER/config/dax/triple_cyclic/with_imgcap_nlpqug/train-hm-base-triple-hpc_0_imgcap_distilbert-base-uncased_substitute.json b/UNITER/config/dax/triple_cyclic/with_imgcap_nlpqug/train-hm-base-triple-hpc_0_imgcap_distilbert-base-uncased_substitute.json new file mode 100644 index 0000000..a23a15d --- /dev/null +++ b/UNITER/config/dax/triple_cyclic/with_imgcap_nlpqug/train-hm-base-triple-hpc_0_imgcap_distilbert-base-uncased_substitute.json @@ -0,0 +1,43 @@ +{ + "root_path": "./", + "dataset_path": "../data", + "precomputed_boxes": { + "train": "data_train_d2_10-100_vg.tsv", + "dev": "data_dev_seen_unseen_d2_10-100_vg.tsv", + "test": "data_test_seen_d2_10-100_vg.tsv" + }, + "captions_file": "imgcap/hm_caption.csv", + "paraphrased_file":"textaug/data_test_paraphrased_nlpaug_distilbert-base-uncased_substitute.jsonl", + "train_image_set": "train+dev", + "val_image_set": "dev", + "test_image_set": "test", + "checkpoint": "../UNITER/storage/pretrained/uniter-base.pt", + "model_config": "./config/uniter-base.json", + "model": "triple", + "use_img_type": false, + "output_dir": "../model_asset/output_triple_dev_seen_unseen_0_imgcap_distilbert-base-uncased_substitute/hm/base", + "max_txt_len": 100, + "conf_th": 0.2, + "max_bb": 100, + "min_bb": 10, + "num_bb": 36, + "train_batch_size": 3328, + "val_batch_size": 2496, + "gradient_accumulation_steps": 2, + "learning_rate": 2e-05, + "valid_steps": 285, + "num_train_steps": 3420, + "optim": "adamw", + "betas": [ + 0.9, + 0.98 + ], + "dropout": 0.2, + "weight_decay": 0.01, + "grad_norm": 2.0, + "warmup_steps": 285, + "seed": 0, + "fp16": true, + "n_workers": 4, + "pin_mem": true +} diff --git a/UNITER/config/dax/triple_cyclic/with_imgcap_nlpqug/train-hm-base-triple-hpc_0_imgcap_distilroberta-base_insert.json b/UNITER/config/dax/triple_cyclic/with_imgcap_nlpqug/train-hm-base-triple-hpc_0_imgcap_distilroberta-base_insert.json new file mode 100644 index 0000000..d591e38 --- /dev/null +++ b/UNITER/config/dax/triple_cyclic/with_imgcap_nlpqug/train-hm-base-triple-hpc_0_imgcap_distilroberta-base_insert.json @@ -0,0 +1,43 @@ +{ + "root_path": "./", + "dataset_path": "../data", + "precomputed_boxes": { + "train": "data_train_d2_10-100_vg.tsv", + "dev": "data_dev_seen_unseen_d2_10-100_vg.tsv", + "test": "data_test_seen_d2_10-100_vg.tsv" + }, + "captions_file": "imgcap/hm_caption.csv", + "paraphrased_file":"textaug/data_test_paraphrased_nlpaug_distilroberta-base_insert.jsonl", + "train_image_set": "train+dev", + "val_image_set": "dev", + "test_image_set": "test", + "checkpoint": "../UNITER/storage/pretrained/uniter-base.pt", + "model_config": "./config/uniter-base.json", + "model": "triple", + "use_img_type": false, + "output_dir": "../model_asset/output_triple_dev_seen_unseen_0_imgcap_distilroberta-base_insert/hm/base", + "max_txt_len": 100, + "conf_th": 0.2, + "max_bb": 100, + "min_bb": 10, + "num_bb": 36, + "train_batch_size": 3328, + "val_batch_size": 2496, + "gradient_accumulation_steps": 2, + "learning_rate": 2e-05, + "valid_steps": 285, + "num_train_steps": 3420, + "optim": "adamw", + "betas": [ + 0.9, + 0.98 + ], + "dropout": 0.2, + "weight_decay": 0.01, + "grad_norm": 2.0, + "warmup_steps": 285, + "seed": 0, + "fp16": true, + "n_workers": 4, + "pin_mem": true +} diff --git a/UNITER/config/dax/triple_cyclic/with_imgcap_nlpqug/train-hm-base-triple-hpc_0_imgcap_distilroberta-base_substitute.json b/UNITER/config/dax/triple_cyclic/with_imgcap_nlpqug/train-hm-base-triple-hpc_0_imgcap_distilroberta-base_substitute.json new file mode 100644 index 0000000..e2bcf6f --- /dev/null +++ b/UNITER/config/dax/triple_cyclic/with_imgcap_nlpqug/train-hm-base-triple-hpc_0_imgcap_distilroberta-base_substitute.json @@ -0,0 +1,43 @@ +{ + "root_path": "./", + "dataset_path": "../data", + "precomputed_boxes": { + "train": "data_train_d2_10-100_vg.tsv", + "dev": "data_dev_seen_unseen_d2_10-100_vg.tsv", + "test": "data_test_seen_d2_10-100_vg.tsv" + }, + "captions_file": "imgcap/hm_caption.csv", + "paraphrased_file":"textaug/data_test_paraphrased_nlpaug_distilroberta-base_substitute.jsonl", + "train_image_set": "train+dev", + "val_image_set": "dev", + "test_image_set": "test", + "checkpoint": "../UNITER/storage/pretrained/uniter-base.pt", + "model_config": "./config/uniter-base.json", + "model": "triple", + "use_img_type": false, + "output_dir": "../model_asset/output_triple_dev_seen_unseen_0_imgcap_distilroberta-base_substitute/hm/base", + "max_txt_len": 100, + "conf_th": 0.2, + "max_bb": 100, + "min_bb": 10, + "num_bb": 36, + "train_batch_size": 3328, + "val_batch_size": 2496, + "gradient_accumulation_steps": 2, + "learning_rate": 2e-05, + "valid_steps": 285, + "num_train_steps": 3420, + "optim": "adamw", + "betas": [ + 0.9, + 0.98 + ], + "dropout": 0.2, + "weight_decay": 0.01, + "grad_norm": 2.0, + "warmup_steps": 285, + "seed": 0, + "fp16": true, + "n_workers": 4, + "pin_mem": true +} diff --git a/UNITER/config/dax/triple_cyclic/with_imgcap_nlpqug/train-hm-base-triple-hpc_0_imgcap_xlnet-base-cased_insert.json b/UNITER/config/dax/triple_cyclic/with_imgcap_nlpqug/train-hm-base-triple-hpc_0_imgcap_xlnet-base-cased_insert.json new file mode 100644 index 0000000..8b5ab0f --- /dev/null +++ b/UNITER/config/dax/triple_cyclic/with_imgcap_nlpqug/train-hm-base-triple-hpc_0_imgcap_xlnet-base-cased_insert.json @@ -0,0 +1,43 @@ +{ + "root_path": "./", + "dataset_path": "../data", + "precomputed_boxes": { + "train": "data_train_d2_10-100_vg.tsv", + "dev": "data_dev_seen_unseen_d2_10-100_vg.tsv", + "test": "data_test_seen_d2_10-100_vg.tsv" + }, + "captions_file": "imgcap/hm_caption.csv", + "paraphrased_file":"textaug/data_test_paraphrased_nlpaug_xlnet-base-cased_insert.jsonl", + "train_image_set": "train+dev", + "val_image_set": "dev", + "test_image_set": "test", + "checkpoint": "../UNITER/storage/pretrained/uniter-base.pt", + "model_config": "./config/uniter-base.json", + "model": "triple", + "use_img_type": false, + "output_dir": "../model_asset/output_triple_dev_seen_unseen_0_imgcap_xlnet-base-cased_insert/hm/base", + "max_txt_len": 100, + "conf_th": 0.2, + "max_bb": 100, + "min_bb": 10, + "num_bb": 36, + "train_batch_size": 3328, + "val_batch_size": 2496, + "gradient_accumulation_steps": 2, + "learning_rate": 2e-05, + "valid_steps": 285, + "num_train_steps": 3420, + "optim": "adamw", + "betas": [ + 0.9, + 0.98 + ], + "dropout": 0.2, + "weight_decay": 0.01, + "grad_norm": 2.0, + "warmup_steps": 285, + "seed": 0, + "fp16": true, + "n_workers": 4, + "pin_mem": true +} diff --git a/UNITER/config/dax/triple_cyclic/with_imgcap_nlpqug/train-hm-base-triple-hpc_0_imgcap_xlnet-base-cased_substitute.json b/UNITER/config/dax/triple_cyclic/with_imgcap_nlpqug/train-hm-base-triple-hpc_0_imgcap_xlnet-base-cased_substitute.json new file mode 100644 index 0000000..fff7dc9 --- /dev/null +++ b/UNITER/config/dax/triple_cyclic/with_imgcap_nlpqug/train-hm-base-triple-hpc_0_imgcap_xlnet-base-cased_substitute.json @@ -0,0 +1,43 @@ +{ + "root_path": "./", + "dataset_path": "../data", + "precomputed_boxes": { + "train": "data_train_d2_10-100_vg.tsv", + "dev": "data_dev_seen_unseen_d2_10-100_vg.tsv", + "test": "data_test_seen_d2_10-100_vg.tsv" + }, + "captions_file": "imgcap/hm_caption.csv", + "paraphrased_file":"textaug/data_test_paraphrased_nlpaug_xlnet-base-cased_substitute.jsonl", + "train_image_set": "train+dev", + "val_image_set": "dev", + "test_image_set": "test", + "checkpoint": "../UNITER/storage/pretrained/uniter-base.pt", + "model_config": "./config/uniter-base.json", + "model": "triple", + "use_img_type": false, + "output_dir": "../model_asset/output_triple_dev_seen_unseen_0_imgcap_xlnet-base-cased_substitute/hm/base", + "max_txt_len": 100, + "conf_th": 0.2, + "max_bb": 100, + "min_bb": 10, + "num_bb": 36, + "train_batch_size": 3328, + "val_batch_size": 2496, + "gradient_accumulation_steps": 2, + "learning_rate": 2e-05, + "valid_steps": 285, + "num_train_steps": 3420, + "optim": "adamw", + "betas": [ + 0.9, + 0.98 + ], + "dropout": 0.2, + "weight_decay": 0.01, + "grad_norm": 2.0, + "warmup_steps": 285, + "seed": 0, + "fp16": true, + "n_workers": 4, + "pin_mem": true +} diff --git a/UNITER/config/dax/with_imgcap/train-hm-large-pa-1gpu-hpc_0_3420.json b/UNITER/config/dax/with_imgcap/train-hm-large-pa-1gpu-hpc_0_3420.json new file mode 100644 index 0000000..fb4d7a5 --- /dev/null +++ b/UNITER/config/dax/with_imgcap/train-hm-large-pa-1gpu-hpc_0_3420.json @@ -0,0 +1,43 @@ +{ + "root_path": "./", + "dataset_path": "../data", + "precomputed_boxes": { + "train": "data_train_d2_10-100_vg.tsv", + "dev": "data_dev_seen_unseen_d2_10-100_vg.tsv", + "test": "data_test_seen_d2_10-100_vg.tsv" + }, + "captions_file": "imgcap/hm_caption.csv", + "paraphrased_file": null, + "train_image_set": "train+dev", + "val_image_set": "dev", + "test_image_set": "test", + "checkpoint": "../UNITER/storage/pretrained/uniter-large.pt", + "model_config": "./config/uniter-large.json", + "model": "paired-attn", + "use_img_type": false, + "output_dir": "../model_asset/with_imgcap/ph2_output_pa_dev_seen_unseen_0_3420/hm/large", + "max_txt_len": 100, + "conf_th": 0.2, + "max_bb": 100, + "min_bb": 10, + "num_bb": 36, + "train_batch_size": 1664, + "val_batch_size": 10240, + "gradient_accumulation_steps": 4, + "learning_rate": 2e-05, + "valid_steps": 285, + "num_train_steps": 3420, + "optim": "adamw", + "betas": [ + 0.9, + 0.98 + ], + "dropout": 0.2, + "weight_decay": 0.01, + "grad_norm": 2.0, + "warmup_steps": 285, + "seed": 0, + "fp16": true, + "n_workers": 4, + "pin_mem": true +} diff --git a/UNITER/config/dax/with_imgcap/train-hm-large-pa-1gpu-hpc_0_3420_2.json b/UNITER/config/dax/with_imgcap/train-hm-large-pa-1gpu-hpc_0_3420_2.json new file mode 100644 index 0000000..9cc8816 --- /dev/null +++ b/UNITER/config/dax/with_imgcap/train-hm-large-pa-1gpu-hpc_0_3420_2.json @@ -0,0 +1,43 @@ +{ + "root_path": "./", + "dataset_path": "../data", + "precomputed_boxes": { + "train": "data_train_d2_10-100_vg.tsv", + "dev": "data_dev_seen_unseen_d2_10-100_vg.tsv", + "test": "data_test_seen_d2_10-100_vg.tsv" + }, + "captions_file": "imgcap/hm_caption_2.csv", + "paraphrased_file": null, + "train_image_set": "train+dev", + "val_image_set": "dev", + "test_image_set": "test", + "checkpoint": "../UNITER/storage/pretrained/uniter-large.pt", + "model_config": "./config/uniter-large.json", + "model": "paired-attn", + "use_img_type": false, + "output_dir": "../model_asset/with_imgcap/ph2_output_pa_dev_seen_unseen_0_3420_2/hm/large", + "max_txt_len": 100, + "conf_th": 0.2, + "max_bb": 100, + "min_bb": 10, + "num_bb": 36, + "train_batch_size": 1664, + "val_batch_size": 10240, + "gradient_accumulation_steps": 4, + "learning_rate": 2e-05, + "valid_steps": 285, + "num_train_steps": 3420, + "optim": "adamw", + "betas": [ + 0.9, + 0.98 + ], + "dropout": 0.2, + "weight_decay": 0.01, + "grad_norm": 2.0, + "warmup_steps": 285, + "seed": 0, + "fp16": true, + "n_workers": 4, + "pin_mem": true +}