{ "_name_or_path": "facebook/wav2vec2-base", "activation_dropout": 0.0, "adapter_attn_dim": null, "adapter_kernel_size": 3, "adapter_stride": 2, "add_adapter": false, "apply_spec_augment": true, "architectures": [ "Wav2Vec2ForSequenceClassification" ], "attention_dropout": 0.1, "bos_token_id": 1, "classifier_proj_size": 256, "codevector_dim": 256, "contrastive_logits_temperature": 0.1, "conv_bias": false, "conv_dim": [ 512, 512, 512, 512, 512, 512, 512 ], "conv_kernel": [ 10, 3, 3, 3, 3, 2, 2 ], "conv_stride": [ 5, 2, 2, 2, 2, 2, 2 ], "ctc_loss_reduction": "sum", "ctc_zero_infinity": false, "diversity_loss_weight": 0.1, "do_stable_layer_norm": false, "eos_token_id": 2, "feat_extract_activation": "gelu", "feat_extract_norm": "group", "feat_proj_dropout": 0.1, "feat_quantizer_dropout": 0.0, "final_dropout": 0.0, "freeze_feat_extract_train": true, "hidden_act": "gelu", "hidden_dropout": 0.1, "hidden_size": 768, "id2label": { "0": "asbfly", "1": "ashdro1", "10": "bcnher", "100": "labcro1", "101": "laudov1", "102": "lblwar1", "103": "lesyel1", "104": "lewduc1", "105": "lirplo", "106": "litegr", "107": "litgre1", "108": "litspi1", "109": "litswi1", "11": "bkcbul1", "110": "lobsun2", "111": "maghor2", "112": "malpar1", "113": "maltro1", "114": "malwoo1", "115": "marsan", "116": "mawthr1", "117": "moipig1", "118": "nilfly2", "119": "niwpig1", "12": "bkrfla1", "120": "nutman", "121": "orihob2", "122": "oripip1", "123": "pabflo1", "124": "paisto1", "125": "piebus1", "126": "piekin1", "127": "placuc3", "128": "plaflo1", "129": "plapri1", "13": "bkskit1", "130": "plhpar1", "131": "pomgrp2", "132": "purher1", "133": "pursun3", "134": "pursun4", "135": "purswa3", "136": "putbab1", "137": "redspu1", "138": "rerswa1", "139": "revbul", "14": "bkwsti", "140": "rewbul", "141": "rewlap1", "142": "rocpig", "143": "rorpar", "144": "rossta2", "145": "rufbab3", "146": "ruftre2", "147": "rufwoo2", "148": "rutfly6", "149": "sbeowl1", "15": "bladro1", "150": "scamin3", "151": "shikra1", "152": "smamin1", "153": "sohmyn1", "154": "spepic1", "155": "spodov", "156": "spoowl1", "157": "sqtbul1", "158": "stbkin1", "159": "sttwoo1", "16": "blaeag1", "160": "thbwar1", "161": "tibfly3", "162": "tilwar1", "163": "vefnut1", "164": "vehpar1", "165": "wbbfly1", "166": "wemhar1", "167": "whbbul2", "168": "whbsho3", "169": "whbtre1", "17": "blakit1", "170": "whbwag1", "171": "whbwat1", "172": "whbwoo2", "173": "whcbar1", "174": "whiter2", "175": "whrmun", "176": "whtkin2", "177": "woosan", "178": "wynlau1", "179": "yebbab1", "18": "blhori1", "180": "yebbul3", "181": "zitcis1", "19": "blnmon1", "2": "ashpri1", "20": "blrwar1", "21": "bncwoo3", "22": "brakit1", "23": "brasta1", "24": "brcful1", "25": "brfowl1", "26": "brnhao1", "27": "brnshr", "28": "brodro1", "29": "brwjac1", "3": "ashwoo2", "30": "brwowl1", "31": "btbeat1", "32": "bwfshr1", "33": "categr", "34": "chbeat1", "35": "cohcuc1", "36": "comfla1", "37": "comgre", "38": "comior1", "39": "comkin1", "4": "asikoe2", "40": "commoo3", "41": "commyn", "42": "compea", "43": "comros", "44": "comsan", "45": "comtai1", "46": "copbar1", "47": "crbsun2", "48": "cregos1", "49": "crfbar1", "5": "asiope1", "50": "crseag1", "51": "dafbab1", "52": "darter2", "53": "eaywag1", "54": "emedov2", "55": "eucdov", "56": "eurbla2", "57": "eurcoo", "58": "forwag1", "59": "gargan", "6": "aspfly1", "60": "gloibi", "61": "goflea1", "62": "graher1", "63": "grbeat1", "64": "grecou1", "65": "greegr", "66": "grefla1", "67": "grehor1", "68": "grejun2", "69": "grenig1", "7": "aspswi1", "70": "grewar3", "71": "grnsan", "72": "grnwar1", "73": "grtdro1", "74": "gryfra", "75": "grynig2", "76": "grywag", "77": "gybpri1", "78": "gyhcaf1", "79": "heswoo1", "8": "barfly1", "80": "hoopoe", "81": "houcro1", "82": "houspa", "83": "inbrob1", "84": "indpit1", "85": "indrob1", "86": "indrol2", "87": "indtit1", "88": "ingori1", "89": "inpher1", "9": "barswa", "90": "insbab1", "91": "insowl1", "92": "integr", "93": "isbduc1", "94": "jerbus2", "95": "junbab2", "96": "junmyn1", "97": "junowl1", "98": "kenplo1", "99": "kerlau2" }, "initializer_range": 0.02, "intermediate_size": 3072, "label2id": { "asbfly": "0", "ashdro1": "1", "ashpri1": "2", "ashwoo2": "3", "asikoe2": "4", "asiope1": "5", "aspfly1": "6", "aspswi1": "7", "barfly1": "8", "barswa": "9", "bcnher": "10", "bkcbul1": "11", "bkrfla1": "12", "bkskit1": "13", "bkwsti": "14", "bladro1": "15", "blaeag1": "16", "blakit1": "17", "blhori1": "18", "blnmon1": "19", "blrwar1": "20", "bncwoo3": "21", "brakit1": "22", "brasta1": "23", "brcful1": "24", "brfowl1": "25", "brnhao1": "26", "brnshr": "27", "brodro1": "28", "brwjac1": "29", "brwowl1": "30", "btbeat1": "31", "bwfshr1": "32", "categr": "33", "chbeat1": "34", "cohcuc1": "35", "comfla1": "36", "comgre": "37", "comior1": "38", "comkin1": "39", "commoo3": "40", "commyn": "41", "compea": "42", "comros": "43", "comsan": "44", "comtai1": "45", "copbar1": "46", "crbsun2": "47", "cregos1": "48", "crfbar1": "49", "crseag1": "50", "dafbab1": "51", "darter2": "52", "eaywag1": "53", "emedov2": "54", "eucdov": "55", "eurbla2": "56", "eurcoo": "57", "forwag1": "58", "gargan": "59", "gloibi": "60", "goflea1": "61", "graher1": "62", "grbeat1": "63", "grecou1": "64", "greegr": "65", "grefla1": "66", "grehor1": "67", "grejun2": "68", "grenig1": "69", "grewar3": "70", "grnsan": "71", "grnwar1": "72", "grtdro1": "73", "gryfra": "74", "grynig2": "75", "grywag": "76", "gybpri1": "77", "gyhcaf1": "78", "heswoo1": "79", "hoopoe": "80", "houcro1": "81", "houspa": "82", "inbrob1": "83", "indpit1": "84", "indrob1": "85", "indrol2": "86", "indtit1": "87", "ingori1": "88", "inpher1": "89", "insbab1": "90", "insowl1": "91", "integr": "92", "isbduc1": "93", "jerbus2": "94", "junbab2": "95", "junmyn1": "96", "junowl1": "97", "kenplo1": "98", "kerlau2": "99", "labcro1": "100", "laudov1": "101", "lblwar1": "102", "lesyel1": "103", "lewduc1": "104", "lirplo": "105", "litegr": "106", "litgre1": "107", "litspi1": "108", "litswi1": "109", "lobsun2": "110", "maghor2": "111", "malpar1": "112", "maltro1": "113", "malwoo1": "114", "marsan": "115", "mawthr1": "116", "moipig1": "117", "nilfly2": "118", "niwpig1": "119", "nutman": "120", "orihob2": "121", "oripip1": "122", "pabflo1": "123", "paisto1": "124", "piebus1": "125", "piekin1": "126", "placuc3": "127", "plaflo1": "128", "plapri1": "129", "plhpar1": "130", "pomgrp2": "131", "purher1": "132", "pursun3": "133", "pursun4": "134", "purswa3": "135", "putbab1": "136", "redspu1": "137", "rerswa1": "138", "revbul": "139", "rewbul": "140", "rewlap1": "141", "rocpig": "142", "rorpar": "143", "rossta2": "144", "rufbab3": "145", "ruftre2": "146", "rufwoo2": "147", "rutfly6": "148", "sbeowl1": "149", "scamin3": "150", "shikra1": "151", "smamin1": "152", "sohmyn1": "153", "spepic1": "154", "spodov": "155", "spoowl1": "156", "sqtbul1": "157", "stbkin1": "158", "sttwoo1": "159", "thbwar1": "160", "tibfly3": "161", "tilwar1": "162", "vefnut1": "163", "vehpar1": "164", "wbbfly1": "165", "wemhar1": "166", "whbbul2": "167", "whbsho3": "168", "whbtre1": "169", "whbwag1": "170", "whbwat1": "171", "whbwoo2": "172", "whcbar1": "173", "whiter2": "174", "whrmun": "175", "whtkin2": "176", "woosan": "177", "wynlau1": "178", "yebbab1": "179", "yebbul3": "180", "zitcis1": "181" }, "layer_norm_eps": 1e-05, "layerdrop": 0.0, "mask_channel_length": 10, "mask_channel_min_space": 1, "mask_channel_other": 0.0, "mask_channel_prob": 0.0, "mask_channel_selection": "static", "mask_feature_length": 10, "mask_feature_min_masks": 0, "mask_feature_prob": 0.0, "mask_time_length": 10, "mask_time_min_masks": 2, "mask_time_min_space": 1, "mask_time_other": 0.0, "mask_time_prob": 0.05, "mask_time_selection": "static", "model_type": "wav2vec2", "no_mask_channel_overlap": false, "no_mask_time_overlap": false, "num_adapter_layers": 3, "num_attention_heads": 12, "num_codevector_groups": 2, "num_codevectors_per_group": 320, "num_conv_pos_embedding_groups": 16, "num_conv_pos_embeddings": 128, "num_feat_extract_layers": 7, "num_hidden_layers": 12, "num_negatives": 100, "output_hidden_size": 768, "pad_token_id": 0, "proj_codevector_dim": 256, "tdnn_dilation": [ 1, 2, 3, 1, 1 ], "tdnn_dim": [ 512, 512, 512, 512, 1500 ], "tdnn_kernel": [ 5, 3, 3, 1, 1 ], "torch_dtype": "float32", "transformers_version": "4.38.0", "use_weighted_layer_sum": false, "vocab_size": 32, "xvector_output_dim": 512 }