|
{ |
|
"dset_type": "vlp", |
|
"dset_name": "vlp", |
|
"domain_name": null, |
|
"model_id": "univtg", |
|
"exp_id": "omni_mini_aio_unified__epo3_f10_b10g1_s0.1_0.1", |
|
"device": 0, |
|
"gpu_id": 0, |
|
"debug": false, |
|
"seed": 2018, |
|
"local_rank": 0, |
|
"eval_split_name": "val", |
|
"data_ratio": 1.0, |
|
"results_root": "results", |
|
"num_workers": 8, |
|
"no_pin_memory": false, |
|
"bsz": 64, |
|
"n_epoch": 100, |
|
"max_es_cnt": 200, |
|
"lr": 0.0001, |
|
"lr_drop": 200, |
|
"lr_gamma": 0.1, |
|
"lr_warmup": 10.0, |
|
"wd": 0.0001, |
|
"grad_clip": 0.1, |
|
"span_loss_type": "l1", |
|
"b_loss_coef": 10.0, |
|
"g_loss_coef": 1.0, |
|
"eos_coef": 0.1, |
|
"f_loss_coef": 10.0, |
|
"s_loss_intra_coef": 0.1, |
|
"s_loss_inter_coef": 0.1, |
|
"main_metric": "[email protected]", |
|
"eval_mode": null, |
|
"eval_bsz": 32, |
|
"eval_epoch": 5, |
|
"eval_init": true, |
|
"save_interval": 5, |
|
"resume": "/data/home/qinghonglin/univtg/results/vlp-vlp/aio_unified_mini-clip-clip-2023_05_27_00/model_e0003.ckpt", |
|
"resume_dir": null, |
|
"resume_all": false, |
|
"start_epoch": null, |
|
"no_sort_results": false, |
|
"max_before_nms": 1000, |
|
"max_after_nms": 10, |
|
"conf_thd": 0.0, |
|
"nms_thd": 0.7, |
|
"use_cache": -1, |
|
"max_q_l": 75, |
|
"max_v_l": 75, |
|
"clip_length": 2.0, |
|
"clip_len_list": null, |
|
"max_windows": 5, |
|
"add_easy_negative": 1, |
|
"easy_negative_only": 1, |
|
"round_multiple": 1, |
|
"train_path": [ |
|
"data/qvhighlights/metadata/qvhighlights_train.jsonl", |
|
"data/charades/metadata/charades_train.jsonl", |
|
"data/ego4d/metadata/nlq_train.jsonl", |
|
"data/tacos/metadata/train.jsonl", |
|
"data/anet/metadata/train.jsonl", |
|
"data/didemo/metadata/train.jsonl" |
|
], |
|
"eval_path": "data/qvhighlights/metadata/qvhighlights_val.jsonl", |
|
"train_path_list": null, |
|
"eval_path_list": null, |
|
"feat_root_list": null, |
|
"no_norm_vfeat": false, |
|
"no_norm_tfeat": false, |
|
"v_feat_dirs": [ |
|
"vid_clip" |
|
], |
|
"t_feat_dir": "txt_clip", |
|
"v_feat_dim": 512, |
|
"t_feat_dim": 512, |
|
"ctx_mode": "video_tef", |
|
"v_feat_types": "clip", |
|
"t_feat_type": "clip", |
|
"position_embedding": "sine", |
|
"n_input_proj": 2, |
|
"temperature": 0.07, |
|
"enc_layers": 4, |
|
"sub_enc_layers": 2, |
|
"dec_layers": 2, |
|
"dim_feedforward": 1024, |
|
"hidden_dim": 512, |
|
"input_dropout": 0.5, |
|
"dropout": 0.0, |
|
"droppath": 0.1, |
|
"txt_drop_ratio": 0, |
|
"use_txt_pos": false, |
|
"nheads": 8, |
|
"num_queries": 10, |
|
"pre_norm": false, |
|
"set_cost_span": 10, |
|
"set_cost_giou": 1, |
|
"set_cost_class": 4, |
|
"saliency_margin": 0.2, |
|
"aux_loss": false, |
|
"max_segment_num": 20, |
|
"max_frame_num": 200, |
|
"top_percent": 0.02, |
|
"qfvs_vid_feature": "fps1", |
|
"qfvs_txt_feature": "query", |
|
"qfvs_dense_shot": -1, |
|
"qfvs_score_ensemble": -1, |
|
"qfvs_score_gather": -1, |
|
"qfvs_loss_gather": -1, |
|
"results_dir": "results/vlp-vlp/omni_mini_aio_unified__epo3_f10_b10g1_s0.1_0.1-clip-clip-2023_05_31_06" |
|
} |