Update README.md
#1
by
Isotonic
- opened
README.md
CHANGED
@@ -35,6 +35,6 @@ merge_method: slerp
|
|
35 |
base_model: nvidia/Llama-3.1-Nemotron-8B-UltraLong-4M-Instruct
|
36 |
dtype: bfloat16
|
37 |
parameters:
|
38 |
-
t: [0, 0.5, 1, 0.5, 0] # V shaped curve:
|
39 |
|
40 |
```
|
|
|
35 |
base_model: nvidia/Llama-3.1-Nemotron-8B-UltraLong-4M-Instruct
|
36 |
dtype: bfloat16
|
37 |
parameters:
|
38 |
+
t: [0, 0.5, 1, 0.5, 0] # V shaped curve: Nemotron-8B for input & output, ReDistill in the middle layers
|
39 |
|
40 |
```
|