File size: 1,684 Bytes
4c2ac8f |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 |
# slices:
#   - sources:
#       - model: TroyDoesAI/Mermaid-Llama-3-8B
#         layer_range: [0, 28]
#   # [0, 28] is good: removing layer 28 changes nothing.
#   - sources:
#       - model: TroyDoesAI/Mermaid-Llama-3-8B
#         layer_range: [29, 32]
# slices:
#   - sources:
#       - model: TroyDoesAI/Mermaid-Llama-3-8B
#         layer_range: [0, 27]
#   # [0, 27] is good: removing layer 27 changes nothing.
#   - sources:
#       - model: TroyDoesAI/Mermaid-Llama-3-8B
#         layer_range: [28, 32]
# slices:
#   - sources:
#       - model: TroyDoesAI/Mermaid-Llama-3-8B
#         layer_range: [0, 26]
#   # [0, 26] is good: removing layer 26 changes nothing.
#   - sources:
#       - model: TroyDoesAI/Mermaid-Llama-3-8B
#         layer_range: [27, 32]
# slices:
#   - sources:
#       - model: TroyDoesAI/Mermaid-Llama-3-8B
#         layer_range: [0, 25]
#   # [0, 25] is good: removing layer 25 changes nothing.
#   - sources:
#       - model: TroyDoesAI/Mermaid-Llama-3-8B
#         layer_range: [26, 32]
# Active recipe: three slices of the same model, listed in layer order.
# Each slice is one `sources` list holding a single model entry, and each
# entry carries its own `layer_range`.
#
# NOTE(review): the experiment notes in this file describe [0, 28] followed
# by [29, 32] as "layer 28 removed", i.e. ranges are read as half-open
# [start, end). Under that reading this recipe keeps layers 0-24, 26 and
# 29-31, and drops layers 25, 27 and 28.
# NOTE(review): layer 26 is kept here although the notes in this file list
# it as removable on its own -- confirm this is intentional.
slices:
  - sources:
      - model: TroyDoesAI/Mermaid-Llama-3-8B
        layer_range: [0, 25]
  - sources:
      - model: TroyDoesAI/Mermaid-Llama-3-8B
        layer_range: [26, 27]
  - sources:
      - model: TroyDoesAI/Mermaid-Llama-3-8B
        layer_range: [29, 32]
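# Per-layer findings:
# Layers 31/32: syntax layers; affect the middle of the output
#   (extra ">" on edges).
#   NOTE(review): the ranges in this file end at 32, so "layer 32" may be a
#   1-based index -- confirm which layers are meant.
# Layer 29: syntax layer; affects the middle of the input
#   (semicolon / colon mix-up).
# TODO: Layer 28 does nothing.
# Layer 27 does nothing.
# Layer 26 does nothing.
# Layer 25 does nothing.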
# Global merge settings (apply to every slice in this file).
# Data type named for the merge.
dtype: float16
# Merge algorithm selected for this recipe.
merge_method: passthrough
|