# Merge configuration (mergekit-style keys).
# NOTE(review): trailing "| |" markdown-table residue was stripped from every
# line; with it, scalar values carried stray pipe characters and "models: | |"
# was not valid YAML.

# Data type requested for the output weights.
out_dtype: bfloat16

# Merge algorithm to apply.
merge_method: model_stock

# Model named as the base of the merge.
base_model: mergekit-community/L3.1-Athena-c-8B

# Models combined in this merge, in their original order.
models:
  - model: meta-llama/Llama-3.1-8B
  - model: meta-llama/Llama-3.1-8B-Instruct
  - model: Skywork/Skywork-o1-Open-Llama-3.1-8B
  - model: Skywork/Skywork-Critic-Llama-3.1-8B
  - model: MathGenie/MathCoder2-Llama-3-8B
  - model: deepseek-ai/DeepSeek-R1-Distill-Llama-8B
  - model: DavidAU/DeepSeek-BlackRoot-R1-Distill-Llama-3.1-8B
  - model: mergekit-community/L3.1-Athena-b-8B