lightningdot
copied
You cannot select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
Readme
Files and versions
191 lines
4.4 KiB
191 lines
4.4 KiB
{
    "compressed_db": false,
    "txt_model_type": "bert-base",
    "txt_model_config": "bert-base-cased",
    "img_model_type": "uniter-base",
    "img_model_config": "./config/img_base.json",
    "model_config": "./config/img_base.json",
    "output_dir": "/storage/pretrain/alltask_ot_alldata_base",
    "project_dim": 768,
    "mrm_prob": 0.15,
    "neg_size": 128,
    "nce_temp": 1.0,
    "itm_neg_prob": 0.0,
    "itm_ot_lambda": 0.0,
    "max_txt_len": 60,
    "conf_th": 0.2,
    "max_bb": 100,
    "min_bb": 10,
    "num_bb": 36,
    "train_batch_size": 10240,
    "val_batch_size": 10240,
    "gradient_accumulation_steps": 6,
    "learning_rate": 5e-05,
    "valid_steps": 10000,
    "num_train_steps": 300000,
    "optim": "adamw",
    "betas": [
        0.9,
        0.98
    ],
    "decay": "linear",
    "dropout": 0.1,
    "weight_decay": 0.01,
    "grad_norm": 5.0,
    "warmup_steps": 10000,
    "seed": 42,
    "fp16": true,
    "n_workers": 3,
    "pin_mem": true,
    "train_datasets": [
        {
            "name": "coco_cap",
            "db": [
                "./data/db/pretrain_caption_coco_train_base-cased.db/",
                "./data/db/pretrain_caption_coco_trainval_base-cased.db/"
            ],
            "img": [
                "./data/img/coco_train2014/",
                "./data/img/coco_val2014/"
            ],
            "tasks": [
                "itm",
                "mlm",
                "mrfr",
                "mrckl"
            ],
            "mix_ratio": [
                16,
                8,
                4,
                4
            ]
        },
        {
            "name": "vg_cap",
            "db": [
                "./data/db/pretrain_caption_vg_train_base-cased.db/"
            ],
            "img": [
                "./data/img/vg/"
            ],
            "tasks": [
                "itm",
                "mlm",
                "mrfr",
                "mrckl"
            ],
            "mix_ratio": [
                16,
                12,
                6,
                6
            ]
        },
        {
            "name": "cc",
            "db": [
                "./data/db/conceptual_caption_train_base-cased.db/"
            ],
            "img": [
                "./data/img/gcc_train/"
            ],
            "tasks": [
                "itm",
                "mlm",
                "mrfr",
                "mrckl"
            ],
            "mix_ratio": [
                16,
                12,
                6,
                6
            ]
        },
        {
            "name": "sbu",
            "db": [
                "./data/db/sbu_caption_train_base-cased.db/"
            ],
            "img": [
                "./data/img/sbu/"
            ],
            "tasks": [
                "itm",
                "mlm",
                "mrfr",
                "mrckl"
            ],
            "mix_ratio": [
                16,
                8,
                4,
                4
            ]
        }
    ],
    "val_datasets": [
        {
            "name": "coco_cap",
            "db": [
                "./data/db/pretrain_caption_coco_val_base-cased.db/"
            ],
            "img": [
                "./data/img/coco_val2014/"
            ],
            "tasks": [
                "itm",
                "mlm",
                "mrfr",
                "mrckl"
            ]
        },
        {
            "name": "vg_cap",
            "db": [
                "./data/db/pretrain_caption_vg_val_base-cased.db/"
            ],
            "img": [
                "./data/img/vg/"
            ],
            "tasks": [
                "itm",
                "mlm",
                "mrfr",
                "mrckl"
            ]
        },
        {
            "name": "cc",
            "db": [
                "./data/db/conceptual_caption_val_base-cased.db/"
            ],
            "img": [
                "./data/img/gcc_val/"
            ],
            "tasks": [
                "itm",
                "mlm",
                "mrfr",
                "mrckl"
            ]
        },
        {
            "name": "sbu",
            "db": [
                "./data/db/sbu_caption_val_base-cased.db/"
            ],
            "img": [
                "./data/img/sbu/"
            ],
            "tasks": [
                "itm",
                "mlm",
                "mrfr",
                "mrckl"
            ]
        }
    ],
    "rank": 0
}