File size: 1,215 Bytes
aebdeb1 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 |
# Merge configuration (schema appears to be mergekit's: models / merge_method /
# base_model / dtype). Combines several Llama-3-8B variants onto a shared base
# using the `dare_ties` method. Each non-base entry carries its own `density`
# and `weight`.
#
# NOTE(review): the per-model weights below sum to 1.05
# (0.25 + 0.20 + 0.15 + 0.15 + 0.30), not 1.00, and `normalize` is not set in
# the global parameters. If a unit sum is intended, either adjust a weight or
# enable normalization -- confirm against the merge tool's documentation.
models:
  # Base model providing a general foundation; it takes no per-model parameters.
  - model: NousResearch/Meta-Llama-3-8B
  - model: NousResearch/Meta-Llama-3-8B-Instruct
    parameters:
      density: 0.60  # Increased density to emphasize instruction-based features
      weight: 0.25  # Reduced weight to balance total sum
  - model: winglian/llama-3-8b-256k-PoSE
    parameters:
      density: 0.60  # Emphasizing extended context handling
      weight: 0.20  # Adjusted to balance the total weight sum
  - model: Locutusque/Llama-3-Orca-1.0-8B
    parameters:
      density: 0.55  # Standard density for effective integration
      weight: 0.15  # Reduced weight to allocate more to critical models
  - model: abacusai/Llama-3-Smaug-8B
    parameters:
      density: 0.55  # Consistent density for uniform behavior
      weight: 0.15  # Reduced weight for balance and efficiency
  - model: beomi/Llama-3-Open-Ko-8B-Instruct-preview
    parameters:
      density: 0.55  # Adjusted density to fit within the ensemble
      weight: 0.30  # Increased weight to emphasize this Korean-based model

merge_method: dare_ties
# Same identifier as the first entry in `models`.
base_model: NousResearch/Meta-Llama-3-8B

# Global parameters applied to the merge as a whole.
parameters:
  int8_mask: true

dtype: bfloat16
|