---
# Model-merge configuration (key layout matches the mergekit config schema —
# NOTE(review): confirm the consuming tool/version).

# Checkpoints that are combined by the merge.
models:
  - model: Zhihu-ai/Zhi-writing-dsr1-14b
  - model: deepseek-ai/DeepSeek-R1-Distill-Qwen-14B
  - model: huihui-ai/Qwen2.5-14B-Instruct-1M-abliterated
  - model: huihui-ai/Qwen2.5-14B-Instruct-abliterated-v2
  - model: mergekit-community/Qwen2.5-14B-della-code
  - model: Qwen/Qwen2.5-14B-Instruct-1M
  - model: SicariusSicariiStuff/Impish_QWEN_14B-1M
  - model: tanliboy/lambda-qwen2.5-14b-dpo-test

# Merge algorithm to apply to the models listed above.
merge_method: karcher

# Reference checkpoint; `tokenizer_source: base` below refers back to it.
base_model: Qwen/Qwen2.5-14B-Instruct

# Settings for the merge method. These must be nested under `parameters:`;
# left at column 0 they become unrelated top-level keys and `parameters`
# itself is null.
parameters:
  # Upper bound on solver iterations (presumably for the iterative Karcher
  # mean — TODO confirm against the merge-method documentation).
  max_iter: 1000
  # NOTE(review): verify that `normalize` and `int8_mask` are honoured by the
  # `karcher` method; they are kept exactly as originally specified.
  normalize: true
  int8_mask: true

# Take the output tokenizer from `base_model`.
tokenizer_source: base

# Data type used for the merged weights.
dtype: float16