Update README.md
Browse files
README.md
CHANGED
@@ -68,11 +68,11 @@ slices:
|
|
68 |
- model: ./Qwen3-32B-Upscaled
|
69 |
layer_range: [0, 32]
|
70 |
parameters:
|
71 |
-
weight: 0.
|
72 |
- model: ./Qwen2.5-72B-Instruct-Aligned
|
73 |
layer_range: [0, 32]
|
74 |
parameters:
|
75 |
-
weight: 0.
|
76 |
|
77 |
# Slice 2: The "Knowledge Bridge" - transplant a pure block from the donor
|
78 |
- merge_method: passthrough
|
@@ -86,11 +86,11 @@ slices:
|
|
86 |
- model: ./Qwen3-32B-Upscaled
|
87 |
layer_range: [32, 64]
|
88 |
parameters:
|
89 |
-
weight: 0.
|
90 |
- model: ./Qwen2.5-72B-Instruct-Aligned
|
91 |
layer_range: [48, 80]
|
92 |
parameters:
|
93 |
-
weight: 0.
|
94 |
|
95 |
tokenizer_source: ./Qwen3-32B-Upscaled
|
96 |
```
|
|
|
68 |
- model: ./Qwen3-32B-Upscaled
|
69 |
layer_range: [0, 32]
|
70 |
parameters:
|
71 |
+
weight: 0.5
|
72 |
- model: ./Qwen2.5-72B-Instruct-Aligned
|
73 |
layer_range: [0, 32]
|
74 |
parameters:
|
75 |
+
weight: 0.5
|
76 |
|
77 |
# Slice 2: The "Knowledge Bridge" - transplant a pure block from the donor
|
78 |
- merge_method: passthrough
|
|
|
86 |
- model: ./Qwen3-32B-Upscaled
|
87 |
layer_range: [32, 64]
|
88 |
parameters:
|
89 |
+
weight: 0.5
|
90 |
- model: ./Qwen2.5-72B-Instruct-Aligned
|
91 |
layer_range: [48, 80]
|
92 |
parameters:
|
93 |
+
weight: 0.5
|
94 |
|
95 |
tokenizer_source: ./Qwen3-32B-Upscaled
|
96 |
```
|