# Repository file: mergekit-ties-isswcgh / mergekit_config.yml
# Page header residue (not part of the config): wassemgtk's picture
# Commit message: Upload folder using huggingface_hub
# Commit: 79f0d12 (verified)
# mergekit configuration: TIES merge of two 14B checkpoints.
merge_method: ties

# Checkpoint the merge is computed relative to. Author's note: Qwen2.5 is an
# alternative base worth experimenting with.
base_model: deepcogito/cogito-v1-preview-qwen-14B

# Author's note: fall back to float16 if bf16 is not well supported.
dtype: bfloat16

# Per-model parameters for TIES: density controls sparsity, weight influences
# importance.
models:
  # NOTE(review): this entry names the same checkpoint as base_model, so its
  # delta from the base is zero and its density/weight may have no effect on
  # the result. Confirm against the mergekit documentation.
  - model: deepcogito/cogito-v1-preview-qwen-14B
    parameters:
      # Start around 0.5-0.7; a higher density keeps more parameters.
      density: 0.6
      # Slightly favor cogito for performance.
      weight: 0.6
  - model: Qwen/Qwen2.5-14B-Instruct-1M
    parameters:
      # Density is usually kept consistent across the merged models.
      density: 0.6
      # Lower weight, but its parameters can still win conflicts where strong.
      weight: 0.4