---
# Mixture-of-experts merge configuration.
# NOTE(review): nesting was reconstructed from a whitespace-mangled copy in
# which every line ended in a stray "|"; the layout follows the mergekit MoE
# config schema — confirm against the consuming tool before merging.

# Top-level merge settings. The base model is also reused below as the first
# routed expert and as the shared expert.
base_model: ehristoforu/Qwen2-1.5b-it-chat
architecture: qwen
gate_mode: hidden
dtype: bfloat16

# Routed experts: one entry per source model, each paired with the prompts
# listed for it.
experts:
  - source_model: ehristoforu/Qwen2-1.5b-it-chat
    positive_prompts:
      - "chat"
      - "assistant"
      - "chat history"
      - "chat context"
      - "writing"
      - "text writing"
      - "editing"
      - "text editing"
      - "multilingual"

  - source_model: ehristoforu/Qwen2-1.5b-it-bioinstruct
    positive_prompts:
      - "bio"
      - "science"
      - "biology"
      - "natural sciences"
      - "scientist"

  - source_model: ehristoforu/Qwen2-1.5b-it-codealpaca
    positive_prompts:
      - "code"
      - "coding"
      - "coder"
      - "programming"
      - "programmer"
      - "code analysis"
      - "code review"
      - "code fix"
      - "code improvement"

  - source_model: ehristoforu/Qwen2-1.5b-it-math
    positive_prompts:
      - "math"
      - "mathematician"
      - "problem solving"
      - "calculating"
      - "logics"

# Shared expert entry (a single one is listed).
shared_experts:
  - source_model: ehristoforu/Qwen2-1.5b-it-chat
    positive_prompts:
      - "chat assistant"
    # NOTE(review): residual_scale is placed on the shared expert because it
    # directly follows that entry in the original; presumably it scales this
    # expert's output — verify against the mergekit MoE docs.
    residual_scale: 0.1