# mergekit merge configuration: combines the Qwen2.5-14B-based checkpoints
# listed below into a single model using the `karcher` merge method.

# Input checkpoints for the merge. The last entry is the same repository that
# is named as `base_model` further down.
models:
  - model: Zhihu-ai/Zhi-writing-dsr1-14b
  - model: agentica-org/DeepCoder-14B-Preview
  - model: mergekit-community/Qwen2.5-14B-della-code
  - model: mergekit-community/Qwen2.5-14B-della-v2-dpo
  - model: mergekit-community/Qwen2.5-14B-della-V6-dpo
  - model: mergekit-community/Qwen2.5-14B-della-Nova-dpo
  - model: mergekit-community/Qwen2.5-14B-della-base-dpo
  - model: mergekit-community/Qwen2.5-14B-della-1M-dpo

merge_method: karcher

# Referenced by `tokenizer_source: base` below.
base_model: mergekit-community/Qwen2.5-14B-della-1M-dpo

parameters:
  # Upper bound on iterations for the iterative karcher merge.
  max_iter: 1000

# Use the tokenizer of `base_model` for the merged output.
tokenizer_source: base

dtype: float16

# NOTE(review): these two keys follow `dtype` in the original ordering, so
# they are kept at the top level here. mergekit normally reads `int8_mask`
# and `normalize` from `parameters`; confirm whether they are meant to live
# there and whether the karcher method uses them at all.
int8_mask: true
normalize: true