# Stage "FlatSolarHermes": task_arithmetic merge of Nous-Hermes-2-SOLAR
# (weight 1.0) using upstage/SOLAR-10.7B-v1.0 as the base model.
# NOTE(review): the base model is also listed under `models` without
# parameters; confirm this is what the merge tool expects.
models:
  - model: NousResearch/Nous-Hermes-2-SOLAR-10.7B
    parameters:
      weight: 1.0
  - model: upstage/SOLAR-10.7B-v1.0
base_model: upstage/SOLAR-10.7B-v1.0
merge_method: task_arithmetic
dtype: float16
name: FlatSolarHermes
---
# Stage "MidpointSlow": linear merge of Frostwind and FlatSolarHermes.
# The two 13-entry weight lists are complementary: at every position they
# sum to 1, moving from all-Frostwind (first entries) to all-FlatSolarHermes
# (last entries).
# NOTE(review): presumably the list is interpolated across layers by the
# merge tool; confirm against its documentation.
models:
  - model: Sao10K/Frostwind-10.7B-v1
    parameters:
      weight: [1, 1, 1, 0.875, 0.75, 0.625, 0.5, 0.375, 0.25, 0.125, 0, 0, 0]
  - model: FlatSolarHermes
    parameters:
      weight: [0, 0, 0, 0.125, 0.25, 0.375, 0.5, 0.625, 0.75, 0.875, 1, 1, 1]
merge_method: linear
dtype: float16
name: MidpointSlow
---
# Stage "MoreOrig": passthrough stack of three slices, in order:
# FlatSolarHermes [0, 32], MidpointSlow [16, 32], Frostwind [16, 48].
# NOTE(review): if layer_range is half-open this yields 32 + 16 + 32 = 80
# layers; confirm the range semantics.
slices:
  - sources:
      - model: FlatSolarHermes
        layer_range: [0, 32]
  - sources:
      - model: MidpointSlow
        layer_range: [16, 32]
  - sources:
      - model: Sao10K/Frostwind-10.7B-v1
        layer_range: [16, 48]
merge_method: passthrough
dtype: float16
name: MoreOrig
---
# Stage "LessOrig": passthrough stack of three slices, in order:
# FlatSolarHermes [0, 24], MidpointSlow [8, 40], Frostwind [24, 48].
# NOTE(review): if layer_range is half-open this yields 24 + 32 + 24 = 80
# layers; confirm the range semantics.
slices:
  - sources:
      - model: FlatSolarHermes
        layer_range: [0, 24]
  - sources:
      - model: MidpointSlow
        layer_range: [8, 40]
  - sources:
      - model: Sao10K/Frostwind-10.7B-v1
        layer_range: [24, 48]
merge_method: passthrough
dtype: float16
name: LessOrig
---
# Stage "CircusesTemp": linear merge of MoreOrig and LessOrig.
# The two 21-entry weight lists are complementary (they sum to 1 at every
# position): MoreOrig dominates at both ends, LessOrig in the middle five
# entries, with a 0.75 / 0.25 step on either side of the middle.
models:
  - model: MoreOrig
    parameters:
      weight: [1, 1, 1, 1, 1, 1, 1, 0.75, 0, 0, 0, 0, 0, 0.75, 1, 1, 1, 1, 1, 1, 1]
  - model: LessOrig
    parameters:
      weight: [0, 0, 0, 0, 0, 0, 0, 0.25, 1, 1, 1, 1, 1, 0.25, 0, 0, 0, 0, 0, 0, 0]
merge_method: linear
dtype: float16
name: CircusesTemp
---
# Stage "FWShell": passthrough stack keeping only the outer layer ranges of
# Frostwind: [0, 8] followed by [40, 48].
# NOTE(review): 8 + 8 = 16 layers if layer_range is half-open; confirm.
slices:
  - sources:
      - model: Sao10K/Frostwind-10.7B-v1
        layer_range: [0, 8]
  - sources:
      - model: Sao10K/Frostwind-10.7B-v1
        layer_range: [40, 48]
merge_method: passthrough
dtype: float16
name: FWShell
---
# Stage "SHShell": passthrough stack keeping only the outer layer ranges of
# FlatSolarHermes: [0, 8] followed by [40, 48].
# NOTE(review): 8 + 8 = 16 layers if layer_range is half-open; confirm.
slices:
  - sources:
      - model: FlatSolarHermes
        layer_range: [0, 8]
  - sources:
      - model: FlatSolarHermes
        layer_range: [40, 48]
merge_method: passthrough
dtype: float16
name: SHShell
---
# Stage "LowerShellL": equal-weight (0.5 / 0.5) linear merge of the two
# shell stages FWShell and SHShell.
models:
  - model: FWShell
    parameters:
      weight: 0.5
  - model: SHShell
    parameters:
      weight: 0.5
merge_method: linear
dtype: float16
name: LowerShellL
---
# Stage "Circuses": passthrough stack that wraps the interior of CircusesTemp
# ([8, 72]) between the two halves of LowerShellL ([0, 8] first, [8, 16] last).
# NOTE(review): 8 + 64 + 8 = 80 layers if layer_range is half-open; confirm.
slices:
  - sources:
      - model: LowerShellL
        layer_range: [0, 8]
  - sources:
      - model: CircusesTemp
        layer_range: [8, 72]
  - sources:
      - model: LowerShellL
        layer_range: [8, 16]
merge_method: passthrough
dtype: float16
name: Circuses
---
# Stage "LostMyLicenseAgain": task_arithmetic merge on top of
# upstage/SOLAR-10.7B-Instruct-v1.0 with a single model entry at weight 0.01.
# NOTE(review): the `A+B` model string presumably means "model A with LoRA B
# applied"; confirm against the merge tool's model-reference syntax.
models:
  - model: upstage/SOLAR-10.7B-Instruct-v1.0+NyxKrage/Solar-Doc-10.7B-Lora
    parameters:
      weight: 0.01
merge_method: task_arithmetic
base_model: upstage/SOLAR-10.7B-Instruct-v1.0
dtype: float16
name: LostMyLicenseAgain
---
# Stage "LMLShell": passthrough stack keeping only the outer layer ranges of
# LostMyLicenseAgain: [0, 8] followed by [40, 48].
# NOTE(review): 8 + 8 = 16 layers if layer_range is half-open; confirm.
slices:
  - sources:
      - model: LostMyLicenseAgain
        layer_range: [0, 8]
  - sources:
      - model: LostMyLicenseAgain
        layer_range: [40, 48]
merge_method: passthrough
dtype: float16
name: LMLShell
---
# Stage "EShell": passthrough stack keeping only the outer layer ranges of
# KoboldAI/Mistral-7B-Erebus-v3: [0, 8] followed by [24, 32].
# NOTE(review): 8 + 8 = 16 layers if layer_range is half-open; confirm.
slices:
  - sources:
      - model: KoboldAI/Mistral-7B-Erebus-v3
        layer_range: [0, 8]
  - sources:
      - model: KoboldAI/Mistral-7B-Erebus-v3
        layer_range: [24, 32]
merge_method: passthrough
dtype: float16
name: EShell
---
# Stage "HShell": passthrough stack keeping only the outer layer ranges of
# KoboldAI/Mistral-7B-Holodeck-1: [0, 8] followed by [24, 32].
# NOTE(review): 8 + 8 = 16 layers if layer_range is half-open; confirm.
slices:
  - sources:
      - model: KoboldAI/Mistral-7B-Holodeck-1
        layer_range: [0, 8]
  - sources:
      - model: KoboldAI/Mistral-7B-Holodeck-1
        layer_range: [24, 32]
merge_method: passthrough
dtype: float16
name: HShell
---
# Stage "UpperShellBell": linear merge of the three shell stages LMLShell,
# EShell and HShell.
# NOTE(review): the weights sum to 2.1 + 0.55 + 0.55 = 3.2, not 1; presumably
# the linear merge normalizes them. Verify before changing any value.
models:
  - model: LMLShell
    parameters:
      weight: 2.1
  - model: EShell
    parameters:
      weight: 0.55
  - model: HShell
    parameters:
      weight: 0.55
merge_method: linear
dtype: float16
name: UpperShellBell
---
# Stage "MoreLicense": passthrough stack of four slices, in order:
# LostMyLicenseAgain [0, 32], Holodeck [16, 24], Erebus [8, 16],
# LostMyLicenseAgain [16, 48].
# NOTE(review): 32 + 8 + 8 + 32 = 80 layers if layer_range is half-open;
# confirm the range semantics.
slices:
  - sources:
      - model: LostMyLicenseAgain
        layer_range: [0, 32]
  - sources:
      - model: KoboldAI/Mistral-7B-Holodeck-1
        layer_range: [16, 24]
  - sources:
      - model: KoboldAI/Mistral-7B-Erebus-v3
        layer_range: [8, 16]
  - sources:
      - model: LostMyLicenseAgain
        layer_range: [16, 48]
merge_method: passthrough
dtype: float16
name: MoreLicense
---
# Stage "LessLicense": passthrough stack of four slices, in order:
# LostMyLicenseAgain [0, 24], Holodeck [8, 24], Erebus [8, 24],
# LostMyLicenseAgain [24, 48].
# NOTE(review): 24 + 16 + 16 + 24 = 80 layers if layer_range is half-open;
# confirm the range semantics.
slices:
  - sources:
      - model: LostMyLicenseAgain
        layer_range: [0, 24]
  - sources:
      - model: KoboldAI/Mistral-7B-Holodeck-1
        layer_range: [8, 24]
  - sources:
      - model: KoboldAI/Mistral-7B-Erebus-v3
        layer_range: [8, 24]
  - sources:
      - model: LostMyLicenseAgain
        layer_range: [24, 48]
merge_method: passthrough
dtype: float16
name: LessLicense
---
# Stage "ThermaeTemp": linear merge of MoreLicense and LessLicense.
# The two 21-entry weight lists are complementary (they sum to 1 at every
# position): MoreLicense dominates at both ends, LessLicense in the middle
# five entries, with a 0.75 / 0.25 step on either side of the middle.
models:
  - model: MoreLicense
    parameters:
      weight: [1, 1, 1, 1, 1, 1, 1, 0.75, 0, 0, 0, 0, 0, 0.75, 1, 1, 1, 1, 1, 1, 1]
  - model: LessLicense
    parameters:
      weight: [0, 0, 0, 0, 0, 0, 0, 0.25, 1, 1, 1, 1, 1, 0.25, 0, 0, 0, 0, 0, 0, 0]
merge_method: linear
dtype: float16
name: ThermaeTemp
---
# Stage "Thermae": passthrough stack that wraps the interior of ThermaeTemp
# ([8, 72]) between the two halves of UpperShellBell ([0, 8] first, [8, 16]
# last).
# NOTE(review): 8 + 64 + 8 = 80 layers if layer_range is half-open; confirm.
slices:
  - sources:
      - model: UpperShellBell
        layer_range: [0, 8]
  - sources:
      - model: ThermaeTemp
        layer_range: [8, 72]
  - sources:
      - model: UpperShellBell
        layer_range: [8, 16]
merge_method: passthrough
dtype: float16
name: Thermae
---
# Final document: equal-weight (0.5 / 0.5) linear merge of Thermae and
# Circuses.
# NOTE(review): unlike the other documents this one has no `name` key;
# presumably it is the final output of the pipeline. Confirm this is
# intentional.
models:
  - model: Thermae
    parameters:
      weight: 0.5
  - model: Circuses
    parameters:
      weight: 0.5
merge_method: linear
dtype: float16