---
# Model-merge configuration (mergekit-style schema).
#
# Linear merge of two checkpoints in which the DeepSeek distill carries
# weight 1 and Qwen3-8B carries weight 0, combined with a tokenizer taken
# from Qwen3-8B plus per-token embedding overrides.
# NOTE(review): with these weights the Qwen3-8B tensors presumably contribute
# nothing to the merged weights and the model is listed only so its tokenizer
# and token embeddings are available - confirm against the merge tool's docs.

models:
  - model: deepseek-ai/DeepSeek-R1-0528-Qwen3-8B
    parameters:
      weight: 1
  - model: Qwen/Qwen3-8B
    parameters:
      weight: 0

merge_method: linear
base_model: deepseek-ai/DeepSeek-R1-0528-Qwen3-8B

# Global merge parameters.
parameters:
  # Use the weights above as written instead of rescaling them.
  # NOTE(review): exact semantics of `normalize` are defined by the merge
  # tool - verify.
  normalize: false

tokenizer:
  # Vocabulary of the output model comes from Qwen3-8B.
  source: "Qwen/Qwen3-8B"

  # Per-token overrides. Keys are quoted because they contain the YAML
  # specials `|`, `<` and `>`; the key strings themselves are unchanged.
  # NOTE(review): token strings must match the donor tokenizer's vocabulary
  # byte-for-byte (including the exact bar and `▁` code points) - confirm.
  tokens:
    # Tokens whose embeddings are taken from Qwen3-8B.
    "<|endoftext|>":
      source: "Qwen/Qwen3-8B"
    "<|im_end|>":
      source: "Qwen/Qwen3-8B"

    # Tokens whose embeddings are copied from the named token in the
    # DeepSeek checkpoint. `force: true` is set on each of them.
    # NOTE(review): `force` presumably applies the override even when the
    # token already exists in the base model - verify.
    "<|end▁of▁sentence|>":
      source:
        model: "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B"
        kind: "model_token"
        token: "<|end▁of▁sentence|>"
      force: true
    "<|User|>":
      source:
        model: "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B"
        kind: "model_token"
        token: "<|User|>"
      force: true
    "<|Assistant|>":
      source:
        model: "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B"
        kind: "model_token"
        token: "<|Assistant|>"
      force: true
    "<|begin▁of▁sentence|>":
      source:
        model: "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B"
        kind: "model_token"
        token: "<|begin▁of▁sentence|>"
      force: true

# Data type used for the merged tensors.
dtype: bfloat16