Fast3R_ViT_Large_512 / config.json
jedyang97's picture
Push model using huggingface_hub.
3d60223 verified
raw
history blame contribute delete
941 Bytes
{
"decoder_args": {
"attn_bias_for_inference_enabled": false,
"attn_drop": 0.0,
"attn_implementation": "flash_attention",
"decoder_type": "fast3r",
"depth": 24,
"drop": 0.0,
"embed_dim": 1024,
"enc_embed_dim": 1024,
"mlp_ratio": 4.0,
"num_heads": 16,
"qkv_bias": true,
"random_image_idx_embedding": true
},
"encoder_args": {
"attn_implementation": "flash_attention",
"depth": 24,
"embed_dim": 1024,
"encoder_type": "croco",
"img_size": 512,
"mlp_ratio": 4,
"num_heads": 16,
"patch_embed_cls": "PatchEmbedDust3R",
"patch_size": 16,
"pos_embed": "RoPE100"
},
"head_args": {
"conf_mode": [
"exp",
1,
Infinity
],
"depth_mode": [
"exp",
-Infinity,
Infinity
],
"head_type": "dpt",
"landscape_only": false,
"output_mode": "pts3d",
"patch_size": 16,
"with_local_head": true
}
}