HaithemH's picture
Upload VJEPA2ForVideoClassification
de4357d verified
{
"architectures": [
"VJEPA2ForVideoClassification"
],
"attention_dropout": 0.0,
"attention_probs_dropout_prob": 0.0,
"crop_size": 256,
"drop_path_rate": 0.0,
"frames_per_clip": 16,
"hidden_act": "gelu",
"hidden_dropout_prob": 0.0,
"hidden_size": 1024,
"id2label": {
"0": "Jump",
"1": "ApplyEyeMakeup",
"2": "ApplyLipstick",
"3": "Biking",
"4": "BlowDryHair",
"5": "BrushingTeeth",
"6": "CuttingInKitchen",
"7": "Haircut",
"8": "Hammering",
"9": "HandstandPushups",
"10": "HandstandWalking",
"11": "HeadMassage",
"12": "Knitting",
"13": "PlayingDaf",
"14": "Typing",
"15": "WalkingWithDog",
"16": "FallDown",
"17": "LyingDown",
"18": "SitDown",
"19": "Sitting",
"20": "StandUp",
"21": "Standing",
"22": "Walking",
"23": "DrinkAngry",
"24": "DrinkDisgust",
"25": "DrinkHappy",
"26": "DrinkNeutral",
"27": "DrinkSad",
"28": "PutonglassesAngry",
"29": "PutonglassesHappy",
"30": "PutonglassesNeutral",
"31": "PutonglassesSad",
"32": "PutonjacketAngry",
"33": "PutonjacketHappy",
"34": "PutonjacketNeutral",
"35": "PutonjacketSad",
"36": "ReadAngry",
"37": "ReadHappy",
"38": "ReadNeutral",
"39": "ReadSad",
"40": "SitdownAngry",
"41": "SitdownHappy",
"42": "SitdownNeutral",
"43": "SitdownSad",
"44": "StandupAngry",
"45": "StandupHappy",
"46": "StandupNeutral",
"47": "StandupSad",
"48": "TakeoffglassesAngry",
"49": "TakeoffglassesHappy",
"50": "TakeoffglassesNeutral",
"51": "TakeoffglassesSad",
"52": "TakeoffjacketAngry",
"53": "TakeoffjacketHappy",
"54": "TakeoffjacketNeutral",
"55": "TakeoffjacketSad",
"56": "WriteAngry",
"57": "WriteHappy",
"58": "WriteNeutral",
"59": "Waving",
"60": "Fighting",
"61": "Clapping",
"62": "WalkingWhileUsingPhone",
"63": "ClosingABook",
"64": "ClosingABox",
"65": "ClosingAClosetCabinet",
"66": "ClosingADoor",
"67": "ClosingALaptop",
"68": "ClosingARefrigerator",
"69": "ClosingAWindow",
"70": "DrinkingFromACupGlassBottle",
"71": "EatingASandwich",
"72": "FixingADoor",
"73": "FixingADoorknob",
"74": "FixingALight",
"75": "FixingAVacuum",
"76": "FixingTheirHair",
"77": "GraspingOntoADoorknob",
"78": "HoldingABag",
"79": "HoldingABlanket",
"80": "HoldingABook",
"81": "HoldingABox",
"82": "HoldingABroom",
"83": "HoldingACupGlassBottleOfSomething",
"84": "HoldingADish",
"85": "HoldingALaptop",
"86": "HoldingAMirror",
"87": "HoldingAPhoneCamera",
"88": "HoldingAPicture",
"89": "HoldingAPillow",
"90": "HoldingASandwich",
"91": "SomeoneIsRunningSomewhere",
"92": "SomeoneIsSmiling",
"93": "SomeoneIsSneezing",
"94": "SomeoneIsStandingUpFromSomewhere",
"95": "HoldingAShoeShoes",
"96": "HoldingATowelS",
"97": "HoldingAVacuum",
"98": "HoldingSomeClothes",
"99": "HoldingSomeFood",
"100": "HoldingSomeMedicine",
"101": "LaughingAtAPicture",
"102": "LaughingAtTelevision",
"103": "LyingOnABed",
"104": "LyingOnASofaCouch",
"105": "LyingOnTheFloor",
"106": "MakingASandwich",
"107": "OpeningABag",
"108": "OpeningABook",
"109": "OpeningABox",
"110": "OpeningAClosetCabinet",
"111": "OpeningADoor",
"112": "OpeningALaptop",
"113": "OpeningARefrigerator",
"114": "OpeningAWindow",
"115": "PlayingWithAPhoneCamera",
"116": "PouringSomethingIntoACupGlassBottle",
"117": "PuttingABagSomewhere",
"118": "PuttingABlanketSomewhere",
"119": "PuttingABookSomewhere",
"120": "PuttingABoxSomewhere",
"121": "PuttingABroomSomewhere",
"122": "PuttingACupGlassBottleSomewhere",
"123": "PuttingADishEsSomewhere",
"124": "PuttingALaptopSomewhere",
"125": "PuttingAPhoneCameraSomewhere",
"126": "PuttingAPictureSomewhere",
"127": "PuttingAPillowSomewhere",
"128": "PuttingASandwichSomewhere",
"129": "PuttingATowelSSomewhere",
"130": "PuttingClothesSomewhere",
"131": "PuttingGroceriesSomewhere",
"132": "PuttingOnShoeShoes",
"133": "PuttingShoesSomewhere",
"134": "PuttingSomeFoodSomewhere",
"135": "PuttingSomethingOnAShelf",
"136": "PuttingSomethingOnATable",
"137": "PuttingTheirPaperNotebookSomewhere",
"138": "ReachingForAndGrabbingAPicture",
"139": "SittingAtATable",
"140": "SittingInABed",
"141": "SittingInAChair",
"142": "SittingOnATable",
"143": "SittingOnSofaCouch",
"144": "SittingOnTheFloor",
"145": "SmilingAtABook",
"146": "SmilingInAMirror",
"147": "SnugglingWithABlanket",
"148": "SnugglingWithAPillow",
"149": "SomeoneIsAwakeningInBed",
"150": "SomeoneIsAwakeningSomewhere",
"151": "SomeoneIsCookingSomething",
"152": "SomeoneIsDressing",
"153": "SomeoneIsEatingSomething",
"154": "SomeoneIsGoingFromStandingToSitting",
"155": "SomeoneIsHoldingAPaperNotebook",
"156": "SomeoneIsLaughing",
"157": "StandingOnAChair",
"158": "SomeoneIsUndressing",
"159": "TakingABlanketFromSomewhere",
"160": "TakingABookFromSomewhere",
"161": "TakingABoxFromSomewhere",
"162": "TakingADishEsFromSomewhere",
"163": "TakingALaptopFromSomewhere",
"164": "TakingAPictureOfSomething",
"165": "TakingABagFromSomewhere",
"166": "TakingABroomFromSomewhere",
"167": "TakingACupGlassBottleFromSomewhere",
"168": "TakingAPhoneCameraFromSomewhere",
"169": "TakingAPillowFromSomewhere",
"170": "TakingASandwichFromSomewhere",
"171": "TakingATowelSFromSomewhere",
"172": "TakingAVacuumFromSomewhere",
"173": "TakingConsumingSomeMedicine",
"174": "TakingFoodFromSomewhere",
"175": "TakingOffSomeShoes",
"176": "TakingPaperNotebookFromSomewhere",
"177": "TakingShoesFromSomewhere",
"178": "TakingSomeClothesFromSomewhere",
"179": "TakingSomethingFromABox",
"180": "TalkingOnAPhoneCamera",
"181": "ThrowingABagSomewhere",
"182": "ThrowingABlanketSomewhere",
"183": "ThrowingABookSomewhere",
"184": "ThrowingABoxSomewhere",
"185": "ThrowingABroomSomewhere",
"186": "ThrowingAPillowSomewhere",
"187": "ThrowingATowelSSomewhere",
"188": "ThrowingClothesSomewhere",
"189": "ThrowingFoodSomewhere",
"190": "ThrowingShoesSomewhere",
"191": "ThrowingSomethingOnTheFloor",
"192": "TidyingAShelfOrSomethingOnAShelf",
"193": "TidyingSomeClothes",
"194": "TidyingSomethingOnTheFloor",
"195": "TidyingUpABlanketS",
"196": "TidyingUpAClosetCabinet",
"197": "TidyingUpATable",
"198": "TidyingUpATowelS",
"199": "TidyingUpWithABroom",
"200": "TurningOffALight",
"201": "TurningOnALight",
"202": "WalkingThroughADoorway",
"203": "WashADishDishes",
"204": "WashingACupGlassBottle",
"205": "WashingAMirror",
"206": "WashingATable",
"207": "WashingAWindow",
"208": "WashingSomeClothes",
"209": "WashingSomethingWithATowel",
"210": "WashingTheirHands",
"211": "WatchingALaptopOrSomethingOnALaptop",
"212": "WatchingLookingAtAPicture",
"213": "WatchingLookingOutsideOfAWindow",
"214": "WatchingReadingLookingAtABook",
"215": "WatchingSomethingSomeoneThemselvesInAMirror",
"216": "WatchingTelevision",
"217": "WorkingAtATable",
"218": "WorkingOnPaperNotebook",
"219": "WorkingPlayingOnALaptop"
},
"image_size": 256,
"in_chans": 3,
"initializer_range": 0.02,
"label2id": {
"ApplyEyeMakeup": 1,
"ApplyLipstick": 2,
"Biking": 3,
"BlowDryHair": 4,
"BrushingTeeth": 5,
"Clapping": 61,
"ClosingABook": 63,
"ClosingABox": 64,
"ClosingAClosetCabinet": 65,
"ClosingADoor": 66,
"ClosingALaptop": 67,
"ClosingARefrigerator": 68,
"ClosingAWindow": 69,
"CuttingInKitchen": 6,
"DrinkAngry": 23,
"DrinkDisgust": 24,
"DrinkHappy": 25,
"DrinkNeutral": 26,
"DrinkSad": 27,
"DrinkingFromACupGlassBottle": 70,
"EatingASandwich": 71,
"FallDown": 16,
"Fighting": 60,
"FixingADoor": 72,
"FixingADoorknob": 73,
"FixingALight": 74,
"FixingAVacuum": 75,
"FixingTheirHair": 76,
"GraspingOntoADoorknob": 77,
"Haircut": 7,
"Hammering": 8,
"HandstandPushups": 9,
"HandstandWalking": 10,
"HeadMassage": 11,
"HoldingABag": 78,
"HoldingABlanket": 79,
"HoldingABook": 80,
"HoldingABox": 81,
"HoldingABroom": 82,
"HoldingACupGlassBottleOfSomething": 83,
"HoldingADish": 84,
"HoldingALaptop": 85,
"HoldingAMirror": 86,
"HoldingAPhoneCamera": 87,
"HoldingAPicture": 88,
"HoldingAPillow": 89,
"HoldingASandwich": 90,
"HoldingAShoeShoes": 95,
"HoldingATowelS": 96,
"HoldingAVacuum": 97,
"HoldingSomeClothes": 98,
"HoldingSomeFood": 99,
"HoldingSomeMedicine": 100,
"Jump": 0,
"Knitting": 12,
"LaughingAtAPicture": 101,
"LaughingAtTelevision": 102,
"LyingDown": 17,
"LyingOnABed": 103,
"LyingOnASofaCouch": 104,
"LyingOnTheFloor": 105,
"MakingASandwich": 106,
"OpeningABag": 107,
"OpeningABook": 108,
"OpeningABox": 109,
"OpeningAClosetCabinet": 110,
"OpeningADoor": 111,
"OpeningALaptop": 112,
"OpeningARefrigerator": 113,
"OpeningAWindow": 114,
"PlayingDaf": 13,
"PlayingWithAPhoneCamera": 115,
"PouringSomethingIntoACupGlassBottle": 116,
"PutonglassesAngry": 28,
"PutonglassesHappy": 29,
"PutonglassesNeutral": 30,
"PutonglassesSad": 31,
"PutonjacketAngry": 32,
"PutonjacketHappy": 33,
"PutonjacketNeutral": 34,
"PutonjacketSad": 35,
"PuttingABagSomewhere": 117,
"PuttingABlanketSomewhere": 118,
"PuttingABookSomewhere": 119,
"PuttingABoxSomewhere": 120,
"PuttingABroomSomewhere": 121,
"PuttingACupGlassBottleSomewhere": 122,
"PuttingADishEsSomewhere": 123,
"PuttingALaptopSomewhere": 124,
"PuttingAPhoneCameraSomewhere": 125,
"PuttingAPictureSomewhere": 126,
"PuttingAPillowSomewhere": 127,
"PuttingASandwichSomewhere": 128,
"PuttingATowelSSomewhere": 129,
"PuttingClothesSomewhere": 130,
"PuttingGroceriesSomewhere": 131,
"PuttingOnShoeShoes": 132,
"PuttingShoesSomewhere": 133,
"PuttingSomeFoodSomewhere": 134,
"PuttingSomethingOnAShelf": 135,
"PuttingSomethingOnATable": 136,
"PuttingTheirPaperNotebookSomewhere": 137,
"ReachingForAndGrabbingAPicture": 138,
"ReadAngry": 36,
"ReadHappy": 37,
"ReadNeutral": 38,
"ReadSad": 39,
"SitDown": 18,
"SitdownAngry": 40,
"SitdownHappy": 41,
"SitdownNeutral": 42,
"SitdownSad": 43,
"Sitting": 19,
"SittingAtATable": 139,
"SittingInABed": 140,
"SittingInAChair": 141,
"SittingOnATable": 142,
"SittingOnSofaCouch": 143,
"SittingOnTheFloor": 144,
"SmilingAtABook": 145,
"SmilingInAMirror": 146,
"SnugglingWithABlanket": 147,
"SnugglingWithAPillow": 148,
"SomeoneIsAwakeningInBed": 149,
"SomeoneIsAwakeningSomewhere": 150,
"SomeoneIsCookingSomething": 151,
"SomeoneIsDressing": 152,
"SomeoneIsEatingSomething": 153,
"SomeoneIsGoingFromStandingToSitting": 154,
"SomeoneIsHoldingAPaperNotebook": 155,
"SomeoneIsLaughing": 156,
"SomeoneIsRunningSomewhere": 91,
"SomeoneIsSmiling": 92,
"SomeoneIsSneezing": 93,
"SomeoneIsStandingUpFromSomewhere": 94,
"SomeoneIsUndressing": 158,
"StandUp": 20,
"Standing": 21,
"StandingOnAChair": 157,
"StandupAngry": 44,
"StandupHappy": 45,
"StandupNeutral": 46,
"StandupSad": 47,
"TakeoffglassesAngry": 48,
"TakeoffglassesHappy": 49,
"TakeoffglassesNeutral": 50,
"TakeoffglassesSad": 51,
"TakeoffjacketAngry": 52,
"TakeoffjacketHappy": 53,
"TakeoffjacketNeutral": 54,
"TakeoffjacketSad": 55,
"TakingABagFromSomewhere": 165,
"TakingABlanketFromSomewhere": 159,
"TakingABookFromSomewhere": 160,
"TakingABoxFromSomewhere": 161,
"TakingABroomFromSomewhere": 166,
"TakingACupGlassBottleFromSomewhere": 167,
"TakingADishEsFromSomewhere": 162,
"TakingALaptopFromSomewhere": 163,
"TakingAPhoneCameraFromSomewhere": 168,
"TakingAPictureOfSomething": 164,
"TakingAPillowFromSomewhere": 169,
"TakingASandwichFromSomewhere": 170,
"TakingATowelSFromSomewhere": 171,
"TakingAVacuumFromSomewhere": 172,
"TakingConsumingSomeMedicine": 173,
"TakingFoodFromSomewhere": 174,
"TakingOffSomeShoes": 175,
"TakingPaperNotebookFromSomewhere": 176,
"TakingShoesFromSomewhere": 177,
"TakingSomeClothesFromSomewhere": 178,
"TakingSomethingFromABox": 179,
"TalkingOnAPhoneCamera": 180,
"ThrowingABagSomewhere": 181,
"ThrowingABlanketSomewhere": 182,
"ThrowingABookSomewhere": 183,
"ThrowingABoxSomewhere": 184,
"ThrowingABroomSomewhere": 185,
"ThrowingAPillowSomewhere": 186,
"ThrowingATowelSSomewhere": 187,
"ThrowingClothesSomewhere": 188,
"ThrowingFoodSomewhere": 189,
"ThrowingShoesSomewhere": 190,
"ThrowingSomethingOnTheFloor": 191,
"TidyingAShelfOrSomethingOnAShelf": 192,
"TidyingSomeClothes": 193,
"TidyingSomethingOnTheFloor": 194,
"TidyingUpABlanketS": 195,
"TidyingUpAClosetCabinet": 196,
"TidyingUpATable": 197,
"TidyingUpATowelS": 198,
"TidyingUpWithABroom": 199,
"TurningOffALight": 200,
"TurningOnALight": 201,
"Typing": 14,
"Walking": 22,
"WalkingThroughADoorway": 202,
"WalkingWhileUsingPhone": 62,
"WalkingWithDog": 15,
"WashADishDishes": 203,
"WashingACupGlassBottle": 204,
"WashingAMirror": 205,
"WashingATable": 206,
"WashingAWindow": 207,
"WashingSomeClothes": 208,
"WashingSomethingWithATowel": 209,
"WashingTheirHands": 210,
"WatchingALaptopOrSomethingOnALaptop": 211,
"WatchingLookingAtAPicture": 212,
"WatchingLookingOutsideOfAWindow": 213,
"WatchingReadingLookingAtABook": 214,
"WatchingSomethingSomeoneThemselvesInAMirror": 215,
"WatchingTelevision": 216,
"Waving": 59,
"WorkingAtATable": 217,
"WorkingOnPaperNotebook": 218,
"WorkingPlayingOnALaptop": 219,
"WriteAngry": 56,
"WriteHappy": 57,
"WriteNeutral": 58
},
"layer_norm_eps": 1e-06,
"mlp_ratio": 4,
"model_type": "vjepa2",
"num_attention_heads": 16,
"num_hidden_layers": 24,
"num_pooler_layers": 3,
"patch_size": 16,
"pred_hidden_size": 384,
"pred_mlp_ratio": 4.0,
"pred_num_attention_heads": 12,
"pred_num_hidden_layers": 12,
"pred_num_mask_tokens": 10,
"pred_zero_init_mask_tokens": true,
"problem_type": "single_label_classification",
"qkv_bias": true,
"torch_dtype": "float32",
"transformers_version": "4.54.0.dev0",
"tubelet_size": 2,
"use_SiLU": false,
"wide_SiLU": true
}