li-14b-v0.4-slerp0.1
10
7
14.0B
—
by
wanlige
Language Model
OTHER
14B params
New
10 downloads
Early-stage
Edge AI:
Mobile
Laptop
Server
32GB+ RAM
Mobile
Laptop
Server
Quick Summary
AI model with specialized capabilities.
Device Compatibility
Mobile
4-6GB RAM
Laptop
16GB RAM
Server
GPU
Minimum Recommended
14GB+ RAM
Code Examples
Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]Configurationyaml
# merge_method: arcee_fusion
# base_model: wanlige/li-14b-v0.4
# tokenizer_source: base
# parameters:
# int8_mask: true
# normalize: true
# rescale: false
# dtype: bfloat16
# out_dtype: bfloat16
# models:
# - model: sthenno-com/miscii-14b-0218
base_model: wanlige/li-14b-v0.4
merge_method: slerp
tokenizer_source: base
dtype: float32
out_dtype: bfloat16
parameters:
t:
- filter: self_attn
value: [ 0.00, 0.50, 0.30, 0.70, 1.00 ]
- filter: mlp
value: [ 1.00, 0.50, 0.70, 0.30, 0.00 ]
- value: [ 0.00, 0.00, 0.00, 0.00, 0.04, 0.08, 0.12, 0.16, 0.24, 0.32, 0.40, 0.48, 0.56, 0.64, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72, 0.64, 0.56, 0.48 ]
slices:
- sources:
- model: wanlige/li-14b-v0.4
layer_range: [ 0, 48 ]
- model: sthenno-com/miscii-14b-0218
layer_range: [ 0, 48 ]
Deploy This Model
Production-ready deployment in minutes
Together.ai
Instant API access to this model
Production-ready inference API. Start free, scale to millions.
Try Free API
Replicate
One-click model deployment
Run models in the cloud with simple API. No DevOps required.
Deploy Now
Disclosure: We may earn a commission from these partners. This helps keep LLMYourWay free.