{ "_name_or_path": "MCG-NJU/videomae-base", "architectures": [ "VideoMAEForVideoClassification" ], "attention_probs_dropout_prob": 0.0, "decoder_hidden_size": 384, "decoder_intermediate_size": 1536, "decoder_num_attention_heads": 6, "decoder_num_hidden_layers": 4, "hidden_act": "gelu", "hidden_dropout_prob": 0.0, "hidden_size": 768, "id2label": { "0": "0", "1": "1", "2": "2", "3": "3", "4": "4", "5": "5", "6": "6", "7": "7", "8": "8", "9": "9", "10": "10", "11": "A", "12": "B", "13": "C", "14": "D", "15": "E", "16": "F", "17": "G", "18": "H", "19": "I", "20": "J", "21": "K", "22": "L", "23": "M", "24": "N", "25": "O", "26": "P", "27": "Q", "28": "R", "29": "S", "30": "T", "31": "U", "32": "V", "33": "W", "34": "X", "35": "Y", "36": "Z", "37": "3g", "38": "4g", "39": "accident", "40": "accompany", "41": "action", "42": "address", "43": "advantage", "44": "advertise", "45": "age", "46": "aim", "47": "alchol", "48": "alcholic", "49": "almond", "50": "app", "51": "applause", "52": "applicant", "53": "application", "54": "association", "55": "attitude", "56": "automatic", "57": "avalanche", "58": "back", "59": "background", "60": "balance", "61": "ban", "62": "bill", "63": "birth", "64": "birthday", "65": "borrow", "66": "braille", "67": "branch", "68": "cheque", "69": "christianity", "70": "cockroach", "71": "coin", "72": "communication", "73": "course", "74": "crayon", "75": "creeper", "76": "deaf", "77": "detail", "78": "drunk", "79": "economical", "80": "engagement", "81": "feeling", "82": "frog", "83": "fun", "84": "future", "85": "gain", "86": "garage", "87": "garbage", "88": "gender", "89": "gift", "90": "globe", "91": "go_together", "92": "government", "93": "habit", "94": "hail", "95": "hang", "96": "haze", "97": "hello", "98": "hero", "99": "hinduism", "100": "hobby", "101": "housefly", "102": "hug", "103": "hungry", "104": "immediate", "105": "important", "106": "individual", "107": "internet", "108": "joke", "109": "judaism", "110": "king", "111": "lack", "112": "leave", "113": "level", "114": "lift", "115": "local", "116": "middle", "117": "mosquito", "118": "mouse", "119": "now", "120": "paisa", "121": "parallel", "122": "parking", "123": "past", "124": "power", "125": "prescription", "126": "process", "127": "profit", "128": "promotion", "129": "queen", "130": "query", "131": "rat", "132": "reason", "133": "record", "134": "regular", "135": "restrain", "136": "reverse", "137": "right", "138": "road", "139": "rule", "140": "rupee", "141": "service", "142": "sheep", "143": "simultaneous", "144": "situation", "145": "success", "146": "suicide", "147": "tied_up", "148": "top", "149": "tour", "150": "trip", "151": "visa", "152": "vision", "153": "voice", "154": "way", "155": "zebra_crossing", "156": "zoo" }, "image_size": 224, "initializer_range": 0.02, "intermediate_size": 3072, "label2id": { "0": 0, "1": 1, "10": 10, "2": 2, "3": 3, "3g": 37, "4": 4, "4g": 38, "5": 5, "6": 6, "7": 7, "8": 8, "9": 9, "A": 11, "B": 12, "C": 13, "D": 14, "E": 15, "F": 16, "G": 17, "H": 18, "I": 19, "J": 20, "K": 21, "L": 22, "M": 23, "N": 24, "O": 25, "P": 26, "Q": 27, "R": 28, "S": 29, "T": 30, "U": 31, "V": 32, "W": 33, "X": 34, "Y": 35, "Z": 36, "accident": 39, "accompany": 40, "action": 41, "address": 42, "advantage": 43, "advertise": 44, "age": 45, "aim": 46, "alchol": 47, "alcholic": 48, "almond": 49, "app": 50, "applause": 51, "applicant": 52, "application": 53, "association": 54, "attitude": 55, "automatic": 56, "avalanche": 57, "back": 58, "background": 59, "balance": 60, "ban": 61, "bill": 62, "birth": 63, "birthday": 64, "borrow": 65, "braille": 66, "branch": 67, "cheque": 68, "christianity": 69, "cockroach": 70, "coin": 71, "communication": 72, "course": 73, "crayon": 74, "creeper": 75, "deaf": 76, "detail": 77, "drunk": 78, "economical": 79, "engagement": 80, "feeling": 81, "frog": 82, "fun": 83, "future": 84, "gain": 85, "garage": 86, "garbage": 87, "gender": 88, "gift": 89, "globe": 90, "go_together": 91, "government": 92, "habit": 93, "hail": 94, "hang": 95, "haze": 96, "hello": 97, "hero": 98, "hinduism": 99, "hobby": 100, "housefly": 101, "hug": 102, "hungry": 103, "immediate": 104, "important": 105, "individual": 106, "internet": 107, "joke": 108, "judaism": 109, "king": 110, "lack": 111, "leave": 112, "level": 113, "lift": 114, "local": 115, "middle": 116, "mosquito": 117, "mouse": 118, "now": 119, "paisa": 120, "parallel": 121, "parking": 122, "past": 123, "power": 124, "prescription": 125, "process": 126, "profit": 127, "promotion": 128, "queen": 129, "query": 130, "rat": 131, "reason": 132, "record": 133, "regular": 134, "restrain": 135, "reverse": 136, "right": 137, "road": 138, "rule": 139, "rupee": 140, "service": 141, "sheep": 142, "simultaneous": 143, "situation": 144, "success": 145, "suicide": 146, "tied_up": 147, "top": 148, "tour": 149, "trip": 150, "visa": 151, "vision": 152, "voice": 153, "way": 154, "zebra_crossing": 155, "zoo": 156 }, "layer_norm_eps": 1e-12, "model_type": "videomae", "norm_pix_loss": true, "num_attention_heads": 12, "num_channels": 3, "num_frames": 16, "num_hidden_layers": 12, "patch_size": 16, "problem_type": "single_label_classification", "qkv_bias": true, "torch_dtype": "float32", "transformers_version": "4.40.0", "tubelet_size": 2, "use_mean_pooling": false }