Kosmos-EVAA-Franken-v36-8B

2
2
llama
by
jaspionjader
Language Model
OTHER
8B params
New
2 downloads
Early-stage
Edge AI:
Mobile
Laptop
Server
18GB+ RAM
Mobile
Laptop
Server
Quick Summary

This is a merge of pre-trained language models created using mergekit.

Device Compatibility

Mobile
4-6GB RAM
Laptop
16GB RAM
Server
GPU
Minimum Recommended
8GB+ RAM

Code Examples

Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16
Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16
Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16
Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16
Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16
Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16
Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16
Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16
Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16
Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16
Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16
Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16
Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16
Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16
Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16
Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16
Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16
Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16
Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16
Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16
Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16
Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16
Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16
Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16
Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16
Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16
Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16
Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16
Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16
Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16
Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16
Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16
Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16
Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16
Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16
Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16
Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16
Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16
Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16
Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16
Configuration (yaml)
# mergekit merge configuration.
# A single slice takes layer_range 0-32 from each of the two source models.
slices:
- sources:
  - model: jaspionjader/f-5-8b
    layer_range:
    - 0
    - 32
  - model: jaspionjader/f-8-8b
    layer_range:
    - 0
    - 32
# The sources are merged with slerp; f-5-8b is also named as the base model.
merge_method: slerp
base_model: jaspionjader/f-5-8b
parameters:
  # NOTE(review): `t` is presumably the slerp interpolation weight and the
  # 5-value lists a per-layer gradient, per the mergekit docs -- confirm.
  t:
  - filter: self_attn
    value:
    - 0.2
    - 0.4
    - 0.1
    - 0.6
    - 0.8
  # Each mlp value equals 1 minus the self_attn value at the same position.
  - filter: mlp
    value:
    - 0.8
    - 0.6
    - 0.9
    - 0.4
    - 0.2
  # Entry with no filter; presumably the default for all other tensors -- confirm.
  - value: 0.5
# NOTE(review): presumably the dtype of the merged weights -- confirm.
dtype: bfloat16

Deploy This Model

Production-ready deployment in minutes

Together.ai

Instant API access to this model

Fastest API

Production-ready inference API. Start free, scale to millions.

Try Free API

Replicate

One-click model deployment

Easiest Setup

Run models in the cloud with simple API. No DevOps required.

Deploy Now

Disclosure: We may earn a commission from these partners. This helps keep LLMYourWay free.