danielhanchen committed on
Commit
32adcc5
·
verified ·
1 Parent(s): cc41504

Add files using upload-large-folder tool

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ figures/benchmark.jpg filter=lfs diff=lfs merge=lfs -text
config.json CHANGED
@@ -37,15 +37,6 @@
37
  "q_lora_rank": 1536,
38
  "qk_nope_head_dim": 128,
39
  "qk_rope_head_dim": 64,
40
- "quantization_config": {
41
- "activation_scheme": "dynamic",
42
- "fmt": "e4m3",
43
- "quant_method": "fp8",
44
- "weight_block_size": [
45
- 128,
46
- 128
47
- ]
48
- },
49
  "rms_norm_eps": 1e-06,
50
  "rope_scaling": {
51
  "beta_fast": 32,
@@ -64,7 +55,8 @@
64
  "topk_group": 4,
65
  "topk_method": "noaux_tc",
66
  "torch_dtype": "bfloat16",
67
- "transformers_version": "4.46.3",
 
68
  "use_cache": true,
69
  "v_head_dim": 128,
70
  "vocab_size": 129280
 
37
  "q_lora_rank": 1536,
38
  "qk_nope_head_dim": 128,
39
  "qk_rope_head_dim": 64,
 
 
 
 
 
 
 
 
 
40
  "rms_norm_eps": 1e-06,
41
  "rope_scaling": {
42
  "beta_fast": 32,
 
55
  "topk_group": 4,
56
  "topk_method": "noaux_tc",
57
  "torch_dtype": "bfloat16",
58
+ "transformers_version": "4.48.1",
59
+ "unsloth_fixed": true,
60
  "use_cache": true,
61
  "v_head_dim": 128,
62
  "vocab_size": 129280
model-00001-of-000163.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c2388e6b127ce6664e35c5e2529c3ce4bfc99f4f7fb6fa48e92b29ed5e4922af
3
- size 5234139343
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5e87b89ead036e72853e1d7cf48136d40d85b90cc242944e58aa7f88900092f
3
+ size 8609454256
model-00002-of-000163.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5f450c75da7eb897b74a092eee65df8bb115fce81cccd2bbaeb220bd97197875
3
- size 4302383966
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b620aa86006f54aac8d8453e9370cb8411119e3038e13df0bce82ebd954729f1
3
+ size 8602553952
model-00003-of-000163.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c79b3418357348d089e88f9de17ac52d7b7a1cfe5dfc7c1b2f1ac1451298b080
3
- size 4302384375
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0be9a653c37d1b3d0817a4721349491cee42c9e5ff0c8658a31dc2291cf1db14
3
+ size 8602554152