# Aqueducts-18B / recipe.yml
# Uploaded by MarsupialAI — commit b02a8ec (verified): "Upload recipe.yml"
# Stage "FlatSolarHermes": task_arithmetic merge of
# NousResearch/Nous-Hermes-2-SOLAR-10.7B (weight 1.0) against the base model
# upstage/SOLAR-10.7B-v1.0. Later documents use it as `model: FlatSolarHermes`.
models:
  - model: NousResearch/Nous-Hermes-2-SOLAR-10.7B
    parameters:
      weight: 1.0
  # The base model is also listed as an input, without parameters of its own.
  - model: upstage/SOLAR-10.7B-v1.0
base_model: upstage/SOLAR-10.7B-v1.0
merge_method: task_arithmetic
dtype: float16
name: FlatSolarHermes
---
# Stage "MidpointSlow": linear blend of Sao10K/Frostwind-10.7B-v1 and
# FlatSolarHermes. The two weight lists are complementary (they sum to 1 at
# every position): Frostwind goes 1 -> 0 while FlatSolarHermes goes 0 -> 1.
# NOTE(review): list-valued weights are presumably interpolated across the
# layer stack by the merge tool — confirm against its documentation.
models:
  - model: Sao10K/Frostwind-10.7B-v1
    parameters:
      weight: [1, 1, 1, 0.875, 0.75, 0.625, 0.5, 0.375, 0.25, 0.125, 0, 0, 0]
  - model: FlatSolarHermes
    parameters:
      weight: [0, 0, 0, 0.125, 0.25, 0.375, 0.5, 0.625, 0.75, 0.875, 1, 1, 1]
merge_method: linear
dtype: float16
name: MidpointSlow
---
# Stage "MoreOrig": passthrough stack of three slices, in order:
# FlatSolarHermes [0, 32], MidpointSlow [16, 32], Frostwind [16, 48].
# NOTE(review): assuming layer_range is half-open [start, end), this is
# 32 + 16 + 32 = 80 layers, the same total as "LessOrig" — confirm.
slices:
  - sources:
      - model: FlatSolarHermes
        layer_range: [0, 32]
  - sources:
      - model: MidpointSlow
        layer_range: [16, 32]
  - sources:
      - model: Sao10K/Frostwind-10.7B-v1
        layer_range: [16, 48]
merge_method: passthrough
dtype: float16
name: MoreOrig
---
# Stage "LessOrig": passthrough stack of three slices, in order:
# FlatSolarHermes [0, 24], MidpointSlow [8, 40], Frostwind [24, 48].
# Compared with "MoreOrig", a wider span comes from the blended MidpointSlow
# model and narrower spans from the two unblended sources.
# NOTE(review): assuming half-open ranges this is 24 + 32 + 24 = 80 layers.
slices:
  - sources:
      - model: FlatSolarHermes
        layer_range: [0, 24]
  - sources:
      - model: MidpointSlow
        layer_range: [8, 40]
  - sources:
      - model: Sao10K/Frostwind-10.7B-v1
        layer_range: [24, 48]
merge_method: passthrough
dtype: float16
name: LessOrig
---
# Stage "CircusesTemp": linear blend of MoreOrig and LessOrig.
# The two 21-entry weight lists are complementary (sum to 1 at each position):
# MoreOrig dominates at both ends, LessOrig takes over in the middle, with a
# 0.75 / 0.25 step on either side of the hand-over.
models:
  - model: MoreOrig
    parameters:
      weight: [1, 1, 1, 1, 1, 1, 1, 0.75, 0, 0, 0, 0, 0, 0.75, 1, 1, 1, 1, 1, 1, 1]
  - model: LessOrig
    parameters:
      weight: [0, 0, 0, 0, 0, 0, 0, 0.25, 1, 1, 1, 1, 1, 0.25, 0, 0, 0, 0, 0, 0, 0]
merge_method: linear
dtype: float16
name: CircusesTemp
---
# Stage "FWShell": passthrough stack of two slices taken from
# Sao10K/Frostwind-10.7B-v1 — layer ranges [0, 8] and [40, 48].
# It is averaged with "SHShell" in the "LowerShellL" stage.
slices:
  - sources:
      - model: Sao10K/Frostwind-10.7B-v1
        layer_range: [0, 8]
  - sources:
      - model: Sao10K/Frostwind-10.7B-v1
        layer_range: [40, 48]
merge_method: passthrough
dtype: float16
name: FWShell
---
# Stage "SHShell": same slicing as "FWShell" (layer ranges [0, 8] and
# [40, 48]) but taken from FlatSolarHermes.
slices:
  - sources:
      - model: FlatSolarHermes
        layer_range: [0, 8]
  - sources:
      - model: FlatSolarHermes
        layer_range: [40, 48]
merge_method: passthrough
dtype: float16
name: SHShell
---
# Stage "LowerShellL": equal-weight (0.5 / 0.5) linear merge of the two
# shell models FWShell and SHShell.
models:
  - model: FWShell
    parameters:
      weight: 0.5
  - model: SHShell
    parameters:
      weight: 0.5
merge_method: linear
dtype: float16
name: LowerShellL
---
# Stage "Circuses": passthrough stack that places CircusesTemp [8, 72]
# between the two halves of LowerShellL ([0, 8] first, [8, 16] last).
# NOTE(review): assuming half-open ranges this is 8 + 64 + 8 = 80 layers.
slices:
  - sources:
      - model: LowerShellL
        layer_range: [0, 8]
  - sources:
      - model: CircusesTemp
        layer_range: [8, 72]
  - sources:
      - model: LowerShellL
        layer_range: [8, 16]
merge_method: passthrough
dtype: float16
name: Circuses
---
# Stage "LostMyLicenseAgain": task_arithmetic merge against the base model
# upstage/SOLAR-10.7B-Instruct-v1.0 with a single input at weight 0.01.
# NOTE(review): the `<model>+<lora>` form presumably applies the
# NyxKrage/Solar-Doc-10.7B-Lora adapter on top of the Instruct model —
# confirm against the merge tool's model-reference syntax.
models:
  - model: upstage/SOLAR-10.7B-Instruct-v1.0+NyxKrage/Solar-Doc-10.7B-Lora
    parameters:
      weight: 0.01
merge_method: task_arithmetic
base_model: upstage/SOLAR-10.7B-Instruct-v1.0
dtype: float16
name: LostMyLicenseAgain
---
# Stage "LMLShell": passthrough stack of two slices taken from
# LostMyLicenseAgain — layer ranges [0, 8] and [40, 48].
# It is one of the three inputs to the "UpperShellBell" stage.
slices:
  - sources:
      - model: LostMyLicenseAgain
        layer_range: [0, 8]
  - sources:
      - model: LostMyLicenseAgain
        layer_range: [40, 48]
merge_method: passthrough
dtype: float16
name: LMLShell
---
# Stage "EShell": passthrough stack of two slices taken from
# KoboldAI/Mistral-7B-Erebus-v3 — layer ranges [0, 8] and [24, 32].
slices:
  - sources:
      - model: KoboldAI/Mistral-7B-Erebus-v3
        layer_range: [0, 8]
  - sources:
      - model: KoboldAI/Mistral-7B-Erebus-v3
        layer_range: [24, 32]
merge_method: passthrough
dtype: float16
name: EShell
---
# Stage "HShell": same slicing as "EShell" (layer ranges [0, 8] and
# [24, 32]) but taken from KoboldAI/Mistral-7B-Holodeck-1.
slices:
  - sources:
      - model: KoboldAI/Mistral-7B-Holodeck-1
        layer_range: [0, 8]
  - sources:
      - model: KoboldAI/Mistral-7B-Holodeck-1
        layer_range: [24, 32]
merge_method: passthrough
dtype: float16
name: HShell
---
# Stage "UpperShellBell": linear merge of the three shell models
# LMLShell, EShell and HShell.
# NOTE(review): the weights sum to 3.2, not 1. This relies on the linear
# merge normalizing weights (roughly 0.66 / 0.17 / 0.17 after normalization)
# — confirm that normalization is enabled by default in the merge tool.
models:
  - model: LMLShell
    parameters:
      weight: 2.1
  - model: EShell
    parameters:
      weight: 0.55
  - model: HShell
    parameters:
      weight: 0.55
merge_method: linear
dtype: float16
name: UpperShellBell
---
# Stage "MoreLicense": passthrough stack of four slices, in order:
# LostMyLicenseAgain [0, 32], Holodeck [16, 24], Erebus [8, 16],
# LostMyLicenseAgain [16, 48].
# NOTE(review): assuming half-open ranges this is 32 + 8 + 8 + 32 = 80
# layers, the same total as "LessLicense" — confirm.
slices:
  - sources:
      - model: LostMyLicenseAgain
        layer_range: [0, 32]
  - sources:
      - model: KoboldAI/Mistral-7B-Holodeck-1
        layer_range: [16, 24]
  - sources:
      - model: KoboldAI/Mistral-7B-Erebus-v3
        layer_range: [8, 16]
  - sources:
      - model: LostMyLicenseAgain
        layer_range: [16, 48]
merge_method: passthrough
dtype: float16
name: MoreLicense
---
# Stage "LessLicense": passthrough stack of four slices, in order:
# LostMyLicenseAgain [0, 24], Holodeck [8, 24], Erebus [8, 24],
# LostMyLicenseAgain [24, 48].
# Compared with "MoreLicense", wider spans come from the two Mistral-7B
# models and narrower spans from LostMyLicenseAgain.
# NOTE(review): assuming half-open ranges this is 24 + 16 + 16 + 24 = 80.
slices:
  - sources:
      - model: LostMyLicenseAgain
        layer_range: [0, 24]
  - sources:
      - model: KoboldAI/Mistral-7B-Holodeck-1
        layer_range: [8, 24]
  - sources:
      - model: KoboldAI/Mistral-7B-Erebus-v3
        layer_range: [8, 24]
  - sources:
      - model: LostMyLicenseAgain
        layer_range: [24, 48]
merge_method: passthrough
dtype: float16
name: LessLicense
---
# Stage "ThermaeTemp": linear blend of MoreLicense and LessLicense.
# The two 21-entry weight lists are complementary (sum to 1 at each position)
# and are the same lists used by the "CircusesTemp" stage: MoreLicense at
# both ends, LessLicense in the middle.
models:
  - model: MoreLicense
    parameters:
      weight: [1, 1, 1, 1, 1, 1, 1, 0.75, 0, 0, 0, 0, 0, 0.75, 1, 1, 1, 1, 1, 1, 1]
  - model: LessLicense
    parameters:
      weight: [0, 0, 0, 0, 0, 0, 0, 0.25, 1, 1, 1, 1, 1, 0.25, 0, 0, 0, 0, 0, 0, 0]
merge_method: linear
dtype: float16
name: ThermaeTemp
---
# Stage "Thermae": passthrough stack that places ThermaeTemp [8, 72]
# between the two halves of UpperShellBell ([0, 8] first, [8, 16] last).
# Mirrors the layout of the "Circuses" stage.
# NOTE(review): assuming half-open ranges this is 8 + 64 + 8 = 80 layers.
slices:
  - sources:
      - model: UpperShellBell
        layer_range: [0, 8]
  - sources:
      - model: ThermaeTemp
        layer_range: [8, 72]
  - sources:
      - model: UpperShellBell
        layer_range: [8, 16]
merge_method: passthrough
dtype: float16
name: Thermae
---
# Last stage: equal-weight (0.5 / 0.5) linear merge of Thermae and Circuses.
# NOTE(review): this is the only document without a `name:` key, so it is
# presumably the recipe's final output — confirm.
models:
  - model: Thermae
    parameters:
      weight: 0.5
  - model: Circuses
    parameters:
      weight: 0.5
merge_method: linear
dtype: float16