{
  "model_id": "smallthinker_500m",
  "model_arch": "qwen2",
  "version": 20241202,
  "llm_config": {
    "embed_dim": 896,
    "ffn_dim": 4864,
    "head_size": 64,
    "kv_dim": 128,
    "n_attn_heads": 14,
    "n_attn_kv_heads": 2,
    "n_ctx": 32768,
    "n_layers": 24,
    "norm_eps": 9.999999974752427e-07,
    "vocab_size": 151936,
    "rope_config": {
      "n_rope_ctx_orig": 32768,
      "rope_attn_factor": 1.0,
      "rope_dim": 64,
      "rope_freq_base": 1000000.0,
      "rope_freq_scale": 1.0,
      "rope_scale_type": "linear",
      "rope_type": -1
    }
  },
  "vision": {}
}