{
  "_name_or_path": "model",
  "architectures": [
    "ViTForImageClassification"
  ],
  "attention_probs_dropout_prob": 0.0,
  "encoder_stride": 16,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.0,
  "hidden_size": 768,
  "id2label": {
    "0": "arms_akimbo",
    "1": "biting_nails",
    "2": "buckle_button,_pulling_shirt_collar,_adjusting_tie",
    "3": "bulging_face,_deep_breath",
    "4": "covering_face",
    "5": "crossing_fingers",
    "6": "dustoffing_clothes",
    "7": "folding_arms",
    "8": "head_up",
    "9": "hold_back_arms",
    "10": "illustrative_body_language",
    "11": "minaret_gesture",
    "12": "moving_torso",
    "13": "playing_with_or_adjusting_hair",
    "14": "playing_with_or_manipulating_objects",
    "15": "pressing_lips",
    "16": "putting_arms_behind_body",
    "17": "rubbing_eyes",
    "18": "rubbing_or_holding_hands",
    "19": "scratching_back",
    "20": "scratching_or_touching_arms",
    "21": "shaking_shoulders",
    "22": "sitting_upright",
    "23": "touching_ears",
    "24": "touching_hat",
    "25": "touching_jaw",
    "26": "touching_or_covering_suprasternal_notch",
    "27": "touching_or_scratching_facial_parts",
    "28": "touching_or_scratching_forehead",
    "29": "touching_or_scratching_head",
    "30": "touching_or_scratching_neck",
    "31": "turtle_neck"
  },
  "image_size": 224,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "arms_akimbo": 0,
    "biting_nails": 1,
    "buckle_button,_pulling_shirt_collar,_adjusting_tie": 2,
    "bulging_face,_deep_breath": 3,
    "covering_face": 4,
    "crossing_fingers": 5,
    "dustoffing_clothes": 6,
    "folding_arms": 7,
    "head_up": 8,
    "hold_back_arms": 9,
    "illustrative_body_language": 10,
    "minaret_gesture": 11,
    "moving_torso": 12,
    "playing_with_or_adjusting_hair": 13,
    "playing_with_or_manipulating_objects": 14,
    "pressing_lips": 15,
    "putting_arms_behind_body": 16,
    "rubbing_eyes": 17,
    "rubbing_or_holding_hands": 18,
    "scratching_back": 19,
    "scratching_or_touching_arms": 20,
    "shaking_shoulders": 21,
    "sitting_upright": 22,
    "touching_ears": 23,
    "touching_hat": 24,
    "touching_jaw": 25,
    "touching_or_covering_suprasternal_notch": 26,
    "touching_or_scratching_facial_parts": 27,
    "touching_or_scratching_forehead": 28,
    "touching_or_scratching_head": 29,
    "touching_or_scratching_neck": 30,
    "turtle_neck": 31
  },
  "layer_norm_eps": 1e-12,
  "model_type": "vit",
  "num_attention_heads": 12,
  "num_channels": 3,
  "num_hidden_layers": 12,
  "patch_size": 16,
  "problem_type": "single_label_classification",
  "qkv_bias": true,
  "torch_dtype": "float32",
  "transformers_version": "4.39.2"
}