{ "architectures": [ "SiglipForImageClassification" ], "id2label": { "0": "None", "1": "abstract", "2": "advertisement", "3": "allegorical painting", "4": "animal painting", "5": "battle painting", "6": "bijinga", "7": "bird-and-flower painting", "8": "calligraphy", "9": "capriccio", "10": "caricature", "11": "cityscape", "12": "cloudscape", "13": "design", "14": "figurative", "15": "flower painting", "16": "genre painting", "17": "history painting", "18": "illustration", "19": "interior", "20": "landscape", "21": "literary painting", "22": "marina", "23": "miniature", "24": "mythological painting", "25": "nude painting (nu)", "26": "panorama", "27": "pastorale", "28": "portrait", "29": "poster", "30": "quadratura", "31": "religious painting", "32": "self-portrait", "33": "shan shui", "34": "sketch and study", "35": "still life", "36": "symbolic painting", "37": "tessellation", "38": "urushi-e", "39": "vanitas", "40": "veduta", "41": "wildlife painting", "42": "yakusha-e" }, "initializer_factor": 1.0, "label2id": { "None": 0, "abstract": 1, "advertisement": 2, "allegorical painting": 3, "animal painting": 4, "battle painting": 5, "bijinga": 6, "bird-and-flower painting": 7, "calligraphy": 8, "capriccio": 9, "caricature": 10, "cityscape": 11, "cloudscape": 12, "design": 13, "figurative": 14, "flower painting": 15, "genre painting": 16, "history painting": 17, "illustration": 18, "interior": 19, "landscape": 20, "literary painting": 21, "marina": 22, "miniature": 23, "mythological painting": 24, "nude painting (nu)": 25, "panorama": 26, "pastorale": 27, "portrait": 28, "poster": 29, "quadratura": 30, "religious painting": 31, "self-portrait": 32, "shan shui": 33, "sketch and study": 34, "still life": 35, "symbolic painting": 36, "tessellation": 37, "urushi-e": 38, "vanitas": 39, "veduta": 40, "wildlife painting": 41, "yakusha-e": 42 }, "model_type": "siglip", "problem_type": "single_label_classification", "text_config": { "attention_dropout": 0.0, "hidden_act": "gelu_pytorch_tanh", "hidden_size": 768, "intermediate_size": 3072, "layer_norm_eps": 1e-06, "max_position_embeddings": 64, "model_type": "siglip_text_model", "num_attention_heads": 12, "num_hidden_layers": 12, "projection_size": 768, "torch_dtype": "float32", "vocab_size": 256000 }, "torch_dtype": "float32", "transformers_version": "4.50.0", "vision_config": { "attention_dropout": 0.0, "hidden_act": "gelu_pytorch_tanh", "hidden_size": 768, "image_size": 224, "intermediate_size": 3072, "layer_norm_eps": 1e-06, "model_type": "siglip_vision_model", "num_attention_heads": 12, "num_channels": 3, "num_hidden_layers": 12, "patch_size": 16, "torch_dtype": "float32" } }