AM-DETR / config.json
lighthouse-emnlp2024's picture
Add scripts
5a8f38f
{
"auto_map": {
"AutoConfig": "configuration_amdetr.AMDETRConfig",
"AutoModel": "modeling_amdetr.AMDETRPredictorWrapper"
},
"a_feat_dim": 768,
"a_feat_dirs": [
"features/clotho-moment/clap"
],
"a_feat_types": "clap",
"architectures": [
"AMDETRPredictorWrapper"
],
"aux_loss": true,
"bsz": 32,
"ckpt_filename": "best.ckpt",
"ckpt_filepath": "results/qd_detr/clotho-moment/clap/best.ckpt",
"clip_length": 1,
"ctx_mode": "audio_tef",
"dec_layers": 2,
"device": "cpu",
"dim_feedforward": 1024,
"dropout": 0.1,
"dset_name": "clotho-moment",
"ema_decay": 0.9,
"enc_layers": 2,
"eos_coef": 0.1,
"eval_bsz": 100,
"eval_epoch_interval": 1,
"eval_log_filename": "val.log",
"eval_log_filepath": "results/qd_detr/clotho-moment/clap/val.log",
"eval_log_txt_formatter": "{time_str} [Epoch] {epoch:03d} [Loss] {loss_str} [Metrics] {eval_metrics_str}\n",
"eval_path": "data/clotho_moment/clotho_moment_val_release.jsonl",
"eval_split_name": "val",
"giou_loss_coef": 1,
"grad_clip": 0.1,
"hidden_dim": 256,
"input_dropout": 0.5,
"kwargs": {},
"label_loss_coef": 4,
"lr": 0.0001,
"lr_drop": 400,
"lw_saliency": 1,
"max_es_cnt": 200,
"max_q_l": 32,
"max_v_l": 75,
"max_windows": 5,
"model_ema": false,
"model_name": "qd_detr",
"model_type": "amdetr",
"n_epoch": 100,
"n_input_proj": 2,
"nheads": 8,
"num_queries": 10,
"num_workers": 4,
"position_embedding": "sine",
"results_dir": "results/qd_detr/clotho-moment/clap",
"saliency_margin": 0.2,
"seed": 2023,
"set_cost_class": 4,
"set_cost_giou": 1,
"set_cost_span": 10,
"span_loss_coef": 10,
"span_loss_type": "l1",
"t_feat_dim": 768,
"t_feat_dir": "features/clotho-moment/clap_text",
"t_feat_dir_pretrain_eval": null,
"t_feat_type": "clap",
"torch_dtype": "float32",
"train_log_filename": "train.log",
"train_log_filepath": "results/qd_detr/clotho-moment/clap/train.log",
"train_log_txt_formatter": "{time_str} [Epoch] {epoch:03d} [Loss] {loss_str}\n",
"train_path": "data/clotho_moment/clotho_moment_train_release.jsonl",
"transformers_version": "4.51.3",
"v_feat_dim": 2,
"v_feat_dirs": null,
"v_feat_types": null,
"wd": 0.0001
}