{
  "auto_map": {
    "AutoConfig": "gigaam_transformers.GigaAMConfig",
    "AutoModel": "gigaam_transformers.GigaAMRNNTHF",
    "AutoModelForSpeechSeq2Seq": "gigaam_transformers.GigaAMRNNTHF",
    "AutoProcessor": "gigaam_transformers.GigaAMProcessor",
    "AutoTokenizer": "gigaam_transformers.GigaAMTokenizer",
    "AutoFeatureExtractor": "gigaam_transformers.GigaAMFeatureExtractor"
  },
  "encoder": {
    "feat_in": 64,
    "n_layers": 16,
    "d_model": 768,
    "subsampling_factor": 4,
    "ff_expansion_factor": 4,
    "self_attention_model": "rotary",
    "pos_emb_max_len": 5000,
    "n_heads": 16,
    "conv_kernel_size": 31,
    "flash_attn": false
  },
  "head": {
    "decoder": {
      "pred_hidden": 320,
      "pred_rnn_layers": 1,
      "num_classes": 34
    },
    "joint": {
      "enc_hidden": 768,
      "pred_hidden": 320,
      "joint_hidden": 320,
      "num_classes": 34
    }
  },
  "labels": [
    " ",
    "а",
    "б",
    "в",
    "г",
    "д",
    "е",
    "ж",
    "з",
    "и",
    "й",
    "к",
    "л",
    "м",
    "н",
    "о",
    "п",
    "р",
    "с",
    "т",
    "у",
    "ф",
    "х",
    "ц",
    "ч",
    "ш",
    "щ",
    "ъ",
    "ы",
    "ь",
    "э",
    "ю",
    "я"
  ],
  "blank_id": 33,
  "pad_token_id": 33,
  "max_symbols": 1000,
  "model_type": "gigaam-rnnt"
}