Update README.md
Browse files
README.md
CHANGED
@@ -53,6 +53,47 @@ I first made passthrough merges of the models listed above into separate parts t
|
|
53 |
|
54 |
### Configs
|
55 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
56 |
```yaml
|
57 |
models:
|
58 |
- model: parts/summanus.ds.9b
|
@@ -68,5 +109,4 @@ parameters:
|
|
68 |
normalize: true
|
69 |
int8_mask: true
|
70 |
dtype: bfloat16
|
71 |
-
|
72 |
```
|
|
|
53 |
|
54 |
### Configs
|
55 |
|
56 |
+
summanus.ds.9b:
|
57 |
+
```yaml
|
58 |
+
models:
|
59 |
+
slices:
|
60 |
+
- sources:
|
61 |
+
- layer_range: [0, 28]
|
62 |
+
model: kromeurus/L3-Blackfall-Summanus-v0.1-15B
|
63 |
+
- sources:
|
64 |
+
- layer_range: [56, 64]
|
65 |
+
model: kromeurus/L3-Blackfall-Summanus-v0.1-15B
|
66 |
+
parameters:
|
67 |
+
int8_mask: true
|
68 |
+
merge_method: passthrough
|
69 |
+
dtype: bfloat16
|
70 |
+
```
|
71 |
+
summanusara.atp1:
|
72 |
+
```yaml
|
73 |
+
models:
|
74 |
+
slices:
|
75 |
+
- sources:
|
76 |
+
- layer_range: [0, 8]
|
77 |
+
model: crestf411/L3-8B-sunfall-v0.4-stheno-v3.2
|
78 |
+
- sources:
|
79 |
+
- layer_range: [8, 16]
|
80 |
+
model: TheDrummer/Llama-3SOME-8B-v2
|
81 |
+
- sources:
|
82 |
+
- layer_range: [16, 24]
|
83 |
+
model: Hastagaras/Jamet-8B-L3-MK.V-Blackroot
|
84 |
+
- sources:
|
85 |
+
- layer_range: [22, 26]
|
86 |
+
model: TheDrummer/Llama-3SOME-8B-v2
|
87 |
+
- sources:
|
88 |
+
- layer_range: [24, 32]
|
89 |
+
model: crestf411/L3-8B-sunfall-v0.4-stheno-v3.2
|
90 |
+
parameters:
|
91 |
+
int8_mask: true
|
92 |
+
merge_method: passthrough
|
93 |
+
dtype: bfloat16
|
94 |
+
```
|
95 |
+
|
96 |
+
final:
|
97 |
```yaml
|
98 |
models:
|
99 |
- model: parts/summanus.ds.9b
|
|
|
109 |
normalize: true
|
110 |
int8_mask: true
|
111 |
dtype: bfloat16
|
|
|
112 |
```
|