---
# Model-merge configuration: combines the models listed under `models`
# using the `ties` merge method, relative to `base_model`.
#
# NOTE(review): this file was previously collapsed onto a single line, which
# is not parseable YAML. The nesting below was reconstructed from key order;
# confirm that the first `parameters` block is meant to belong to the second
# model entry only.

# Models to merge.
models:
  # No per-model parameters here; presumably the top-level `parameters`
  # below apply to this entry — verify against the merge tool's docs.
  - model: deepseek-ai/DeepSeek-R1-Distill-Qwen-14B
  - model: Qwen/Qwen2.5-14B-Instruct
    parameters:
      weight: 1
      density: 1

merge_method: ties
base_model: Qwen/Qwen2.5-14B-Instruct-1M

# Top-level merge parameters.
parameters:
  weight: 1
  density: 1
  normalize: true
  int8_mask: true

dtype: bfloat16