callmesan's picture
Training in progress, step 500
bcd10ff verified
{
"_name_or_path": "Harveenchadha/vakyansh-wav2vec2-malayalam-mlm-8",
"activation_dropout": 0.1,
"adapter_attn_dim": null,
"adapter_kernel_size": 3,
"adapter_stride": 2,
"add_adapter": false,
"apply_spec_augment": true,
"architectures": [
"Wav2Vec2ForSequenceClassification"
],
"attention_dropout": 0.1,
"bos_token": "<s>",
"bos_token_id": 0,
"classifier_proj_size": 256,
"codevector_dim": 256,
"contrastive_logits_temperature": 0.1,
"conv_bias": false,
"conv_dim": [
512,
512,
512,
512,
512,
512,
512
],
"conv_kernel": [
10,
3,
3,
3,
3,
2,
2
],
"conv_stride": [
5,
2,
2,
2,
2,
2,
2
],
"ctc_loss_reduction": "sum",
"ctc_zero_infinity": false,
"diversity_loss_weight": 0.1,
"do_lower_case": false,
"do_stable_layer_norm": false,
"eos_token": "</s>",
"eos_token_id": 2,
"feat_extract_activation": "gelu",
"feat_extract_norm": "group",
"feat_proj_dropout": 0.1,
"feat_quantizer_dropout": 0.0,
"final_dropout": 0.1,
"gradient_checkpointing": false,
"hidden_act": "gelu",
"hidden_dropout": 0.1,
"hidden_size": 768,
"id2label": {
"0": 1,
"1": 0,
"10": 0,
"100": 0,
"101": 1,
"102": 0,
"103": 1,
"104": 1,
"105": 0,
"106": 1,
"107": 1,
"108": 0,
"109": 1,
"11": 1,
"110": 0,
"111": 0,
"112": 0,
"113": 0,
"114": 0,
"115": 0,
"116": 0,
"117": 0,
"118": 0,
"119": 1,
"12": 1,
"120": 0,
"121": 0,
"122": 1,
"123": 0,
"124": 0,
"125": 1,
"126": 0,
"127": 0,
"128": 0,
"129": 0,
"13": 1,
"130": 0,
"131": 0,
"132": 1,
"133": 0,
"134": 0,
"135": 0,
"136": 0,
"137": 1,
"138": 0,
"139": 0,
"14": 0,
"140": 1,
"141": 0,
"142": 1,
"143": 0,
"144": 0,
"145": 0,
"146": 1,
"147": 0,
"148": 1,
"149": 1,
"15": 0,
"150": 0,
"151": 1,
"152": 0,
"153": 0,
"154": 0,
"155": 0,
"156": 0,
"157": 0,
"158": 0,
"159": 1,
"16": 0,
"160": 0,
"161": 1,
"162": 0,
"163": 0,
"164": 0,
"165": 1,
"166": 0,
"167": 0,
"168": 1,
"169": 0,
"17": 1,
"170": 0,
"171": 1,
"172": 0,
"173": 1,
"174": 0,
"175": 0,
"176": 0,
"177": 0,
"178": 1,
"179": 0,
"18": 0,
"180": 0,
"181": 1,
"182": 1,
"183": 1,
"184": 0,
"185": 0,
"186": 1,
"187": 0,
"188": 1,
"189": 1,
"19": 1,
"190": 1,
"191": 1,
"192": 0,
"193": 0,
"194": 1,
"195": 0,
"196": 0,
"197": 0,
"198": 1,
"199": 1,
"2": 1,
"20": 1,
"200": 1,
"201": 0,
"202": 0,
"203": 0,
"204": 0,
"205": 0,
"206": 0,
"207": 0,
"208": 0,
"209": 0,
"21": 0,
"210": 1,
"211": 1,
"212": 1,
"213": 1,
"214": 0,
"215": 1,
"216": 0,
"217": 0,
"218": 0,
"219": 0,
"22": 0,
"220": 0,
"221": 1,
"222": 0,
"223": 0,
"224": 0,
"225": 0,
"226": 0,
"227": 1,
"228": 0,
"229": 1,
"23": 0,
"230": 0,
"231": 0,
"232": 0,
"233": 0,
"234": 0,
"235": 0,
"236": 0,
"237": 0,
"238": 0,
"239": 1,
"24": 0,
"240": 0,
"241": 0,
"242": 0,
"243": 1,
"244": 0,
"245": 0,
"246": 0,
"247": 0,
"248": 0,
"249": 0,
"25": 0,
"250": 0,
"251": 0,
"252": 0,
"253": 1,
"254": 0,
"255": 1,
"256": 0,
"257": 0,
"258": 0,
"259": 0,
"26": 0,
"260": 0,
"261": 0,
"262": 0,
"263": 0,
"264": 0,
"265": 0,
"266": 0,
"267": 1,
"268": 1,
"269": 0,
"27": 1,
"270": 1,
"271": 0,
"272": 0,
"273": 0,
"274": 0,
"275": 0,
"276": 0,
"277": 0,
"278": 0,
"279": 0,
"28": 0,
"280": 1,
"281": 0,
"282": 1,
"283": 0,
"284": 0,
"285": 0,
"286": 1,
"287": 0,
"288": 0,
"289": 0,
"29": 1,
"290": 0,
"291": 0,
"292": 1,
"293": 0,
"294": 0,
"295": 0,
"296": 0,
"297": 0,
"298": 1,
"299": 1,
"3": 0,
"30": 0,
"300": 0,
"301": 0,
"302": 0,
"303": 0,
"304": 0,
"305": 0,
"306": 1,
"307": 1,
"308": 1,
"309": 0,
"31": 1,
"310": 0,
"311": 0,
"312": 0,
"313": 1,
"314": 0,
"315": 0,
"316": 0,
"317": 0,
"318": 0,
"319": 1,
"32": 0,
"320": 1,
"321": 1,
"322": 0,
"323": 0,
"324": 0,
"325": 0,
"326": 0,
"327": 1,
"328": 1,
"329": 0,
"33": 0,
"330": 0,
"331": 1,
"332": 0,
"333": 0,
"334": 0,
"335": 0,
"336": 1,
"337": 0,
"338": 1,
"339": 0,
"34": 0,
"340": 0,
"341": 0,
"342": 1,
"343": 0,
"344": 0,
"345": 0,
"346": 0,
"347": 1,
"348": 0,
"349": 0,
"35": 0,
"350": 0,
"351": 1,
"352": 0,
"353": 0,
"354": 1,
"355": 0,
"356": 0,
"357": 1,
"358": 0,
"359": 0,
"36": 0,
"360": 0,
"361": 1,
"362": 0,
"363": 0,
"364": 0,
"365": 0,
"366": 0,
"367": 0,
"368": 0,
"369": 1,
"37": 0,
"370": 0,
"371": 0,
"372": 0,
"373": 1,
"374": 0,
"375": 1,
"376": 0,
"377": 0,
"378": 1,
"379": 0,
"38": 0,
"380": 0,
"381": 1,
"382": 0,
"383": 0,
"384": 0,
"385": 0,
"386": 1,
"387": 0,
"388": 1,
"389": 1,
"39": 1,
"390": 1,
"391": 0,
"392": 0,
"393": 1,
"394": 0,
"395": 1,
"396": 0,
"397": 0,
"398": 1,
"399": 0,
"4": 1,
"40": 0,
"400": 1,
"401": 0,
"402": 1,
"403": 0,
"404": 1,
"405": 1,
"406": 0,
"407": 1,
"408": 0,
"409": 1,
"41": 0,
"410": 0,
"411": 0,
"412": 1,
"413": 0,
"414": 0,
"415": 0,
"416": 1,
"417": 0,
"418": 1,
"419": 0,
"42": 0,
"420": 0,
"421": 0,
"422": 0,
"423": 1,
"424": 0,
"425": 0,
"426": 0,
"427": 0,
"428": 1,
"429": 0,
"43": 0,
"430": 1,
"431": 0,
"432": 0,
"433": 0,
"434": 0,
"435": 0,
"436": 0,
"437": 0,
"438": 0,
"439": 0,
"44": 0,
"440": 0,
"441": 0,
"442": 0,
"443": 0,
"444": 0,
"445": 0,
"446": 0,
"447": 0,
"448": 1,
"449": 0,
"45": 0,
"450": 0,
"451": 0,
"452": 0,
"453": 0,
"454": 0,
"455": 0,
"456": 0,
"457": 0,
"458": 1,
"459": 0,
"46": 0,
"460": 1,
"461": 0,
"462": 0,
"463": 1,
"464": 0,
"465": 1,
"466": 0,
"467": 0,
"468": 0,
"469": 0,
"47": 0,
"470": 0,
"471": 0,
"472": 1,
"473": 0,
"474": 0,
"475": 1,
"476": 0,
"477": 0,
"478": 0,
"479": 0,
"48": 1,
"480": 0,
"481": 1,
"482": 0,
"483": 0,
"484": 0,
"485": 1,
"486": 0,
"487": 1,
"488": 0,
"489": 1,
"49": 0,
"490": 1,
"491": 0,
"492": 0,
"493": 1,
"494": 0,
"495": 0,
"496": 0,
"497": 1,
"498": 0,
"499": 1,
"5": 1,
"50": 1,
"500": 0,
"501": 1,
"502": 1,
"503": 0,
"504": 1,
"505": 1,
"506": 0,
"507": 0,
"508": 0,
"509": 0,
"51": 0,
"510": 0,
"511": 0,
"512": 1,
"513": 1,
"514": 0,
"515": 0,
"516": 0,
"517": 0,
"518": 1,
"519": 0,
"52": 0,
"520": 1,
"521": 0,
"522": 0,
"523": 0,
"524": 0,
"525": 0,
"526": 1,
"527": 1,
"528": 0,
"529": 0,
"53": 0,
"530": 0,
"531": 0,
"532": 0,
"533": 0,
"534": 0,
"535": 0,
"536": 0,
"537": 0,
"538": 0,
"539": 0,
"54": 0,
"540": 1,
"541": 1,
"542": 0,
"543": 1,
"544": 1,
"545": 0,
"546": 0,
"547": 0,
"548": 0,
"549": 0,
"55": 0,
"550": 1,
"551": 0,
"552": 0,
"553": 0,
"554": 0,
"555": 1,
"556": 0,
"557": 0,
"558": 1,
"559": 0,
"56": 0,
"560": 0,
"561": 1,
"562": 0,
"563": 0,
"564": 1,
"565": 1,
"566": 0,
"567": 0,
"568": 0,
"569": 0,
"57": 0,
"570": 0,
"571": 1,
"572": 0,
"573": 0,
"574": 0,
"575": 1,
"576": 0,
"577": 0,
"578": 0,
"579": 0,
"58": 0,
"580": 1,
"581": 0,
"582": 1,
"583": 0,
"584": 0,
"585": 1,
"586": 0,
"587": 1,
"588": 0,
"589": 1,
"59": 0,
"590": 0,
"591": 0,
"592": 0,
"593": 0,
"594": 0,
"595": 1,
"596": 0,
"597": 0,
"598": 1,
"599": 0,
"6": 0,
"60": 1,
"600": 1,
"601": 1,
"602": 0,
"603": 1,
"604": 0,
"605": 0,
"606": 0,
"607": 0,
"608": 1,
"609": 0,
"61": 0,
"610": 0,
"611": 0,
"612": 0,
"613": 0,
"614": 0,
"615": 0,
"616": 0,
"617": 1,
"618": 0,
"619": 0,
"62": 0,
"620": 0,
"621": 0,
"622": 0,
"623": 1,
"624": 0,
"625": 1,
"626": 0,
"627": 1,
"628": 0,
"629": 1,
"63": 0,
"630": 0,
"631": 0,
"632": 1,
"633": 0,
"634": 1,
"635": 0,
"636": 0,
"637": 0,
"638": 0,
"639": 0,
"64": 0,
"640": 0,
"641": 0,
"642": 1,
"643": 0,
"644": 0,
"645": 0,
"646": 0,
"647": 0,
"648": 0,
"649": 1,
"65": 0,
"650": 0,
"651": 1,
"652": 1,
"653": 0,
"654": 1,
"655": 0,
"656": 0,
"657": 1,
"658": 1,
"659": 1,
"66": 1,
"660": 0,
"661": 0,
"662": 0,
"663": 1,
"664": 0,
"665": 0,
"666": 0,
"667": 1,
"668": 0,
"669": 1,
"67": 0,
"670": 1,
"671": 0,
"672": 0,
"673": 0,
"674": 0,
"675": 0,
"676": 0,
"677": 0,
"678": 0,
"679": 0,
"68": 0,
"680": 0,
"681": 0,
"682": 0,
"683": 0,
"684": 0,
"685": 0,
"686": 1,
"687": 0,
"688": 0,
"689": 0,
"69": 1,
"690": 1,
"691": 0,
"692": 0,
"693": 0,
"694": 0,
"695": 1,
"696": 0,
"697": 0,
"698": 0,
"699": 1,
"7": 0,
"70": 0,
"700": 0,
"701": 1,
"702": 0,
"703": 0,
"704": 0,
"705": 0,
"706": 0,
"707": 0,
"708": 1,
"709": 0,
"71": 0,
"710": 0,
"711": 0,
"712": 0,
"713": 0,
"714": 0,
"715": 0,
"716": 0,
"717": 1,
"718": 0,
"719": 1,
"72": 0,
"720": 0,
"721": 0,
"722": 0,
"723": 0,
"724": 0,
"725": 0,
"726": 1,
"727": 0,
"728": 0,
"729": 0,
"73": 1,
"730": 0,
"731": 0,
"732": 0,
"733": 0,
"734": 1,
"735": 0,
"736": 1,
"737": 0,
"738": 0,
"739": 0,
"74": 1,
"740": 1,
"741": 0,
"742": 1,
"743": 0,
"744": 0,
"745": 0,
"746": 1,
"747": 1,
"748": 0,
"749": 0,
"75": 1,
"750": 1,
"751": 1,
"752": 0,
"753": 1,
"754": 0,
"755": 0,
"756": 1,
"757": 1,
"758": 0,
"759": 0,
"76": 0,
"760": 1,
"761": 0,
"762": 0,
"763": 0,
"764": 0,
"765": 1,
"766": 0,
"767": 0,
"768": 1,
"769": 0,
"77": 0,
"770": 0,
"771": 0,
"772": 1,
"773": 0,
"774": 0,
"775": 0,
"776": 0,
"777": 0,
"778": 0,
"779": 0,
"78": 0,
"780": 0,
"781": 0,
"782": 0,
"783": 0,
"784": 0,
"785": 1,
"786": 0,
"787": 0,
"788": 0,
"789": 0,
"79": 1,
"790": 0,
"791": 1,
"792": 1,
"793": 0,
"794": 0,
"795": 0,
"796": 0,
"797": 0,
"798": 0,
"799": 1,
"8": 1,
"80": 0,
"800": 1,
"801": 1,
"802": 0,
"803": 0,
"804": 0,
"805": 1,
"806": 1,
"807": 0,
"808": 1,
"809": 0,
"81": 1,
"810": 1,
"811": 0,
"812": 0,
"813": 1,
"814": 1,
"815": 1,
"816": 0,
"817": 1,
"818": 0,
"82": 1,
"83": 0,
"84": 0,
"85": 0,
"86": 1,
"87": 1,
"88": 0,
"89": 0,
"9": 1,
"90": 0,
"91": 0,
"92": 0,
"93": 1,
"94": 1,
"95": 1,
"96": 0,
"97": 1,
"98": 0,
"99": 0
},
"initializer_range": 0.02,
"intermediate_size": 3072,
"label2id": {
"0": "818",
"1": "817"
},
"layer_norm_eps": 1e-05,
"layerdrop": 0.1,
"mask_feature_length": 10,
"mask_feature_min_masks": 0,
"mask_feature_prob": 0.0,
"mask_time_length": 10,
"mask_time_min_masks": 2,
"mask_time_prob": 0.05,
"model_type": "wav2vec2",
"num_adapter_layers": 3,
"num_attention_heads": 12,
"num_codevector_groups": 2,
"num_codevectors_per_group": 320,
"num_conv_pos_embedding_groups": 16,
"num_conv_pos_embeddings": 128,
"num_feat_extract_layers": 7,
"num_hidden_layers": 12,
"num_negatives": 100,
"output_hidden_size": 768,
"pad_token": "[PAD]",
"pad_token_id": 1,
"proj_codevector_dim": 256,
"tdnn_dilation": [
1,
2,
3,
1,
1
],
"tdnn_dim": [
512,
512,
512,
512,
1500
],
"tdnn_kernel": [
5,
3,
3,
1,
1
],
"torch_dtype": "float32",
"transformers_version": "4.33.0",
"unk_token": "[UNK]",
"use_weighted_layer_sum": false,
"vocab_size": 72,
"word_delimiter_token": "|",
"xvector_output_dim": 512
}