```yaml
models:
  - model: deepseek-ai/DeepSeek-R1-Distill-Qwen-14B
  - model: qihoo360/Light-R1-14B-DS
  - model: arcee-ai/Virtuoso-Small-v2
  - model: Qwen/Qwen2.5-14B-Instruct
  - model: YOYO-AI/Qwen2.5-Coder-14B-YOYO-1010
  - model: Qwen/Qwen2.5-14B-Instruct-1M
  - model: tanliboy/lambda-qwen2.5-14b-dpo-test
merge_method: model_stock
base_model: Qwen/Qwen2.5-14B-Instruct
tokenizer_source: base
normalize: true
int8_mask: true
dtype: bfloat16
```