fix-future-tokens-n1.5 (#5)
Browse files
- update model card with future tokens and rm unused weights (10ee14a1e8960ae6f5473e63a9712cf8774b5b63)
- config.json +1 -0
- model-00001-of-00004.safetensors → model-00001-of-00003.safetensors +0 -0
- model-00002-of-00004.safetensors → model-00002-of-00003.safetensors +2 -2
- model-00003-of-00004.safetensors → model-00003-of-00003.safetensors +2 -2
- model-00004-of-00004.safetensors +0 -3
- model.safetensors.index.json +0 -0
config.json
CHANGED
@@ -44,6 +44,7 @@
|
|
44 |
"architectures": [
|
45 |
"GR00T_N1_5"
|
46 |
],
|
|
|
47 |
"backbone_cfg": {
|
48 |
"eagle_path": "NVEagle/eagle_er-qwen3_1_7B-Siglip2_400M_stage1_5_128gpu_er_v7_1mlp_nops",
|
49 |
"load_bf16": false,
|
|
|
44 |
"architectures": [
|
45 |
"GR00T_N1_5"
|
46 |
],
|
47 |
+
"attn_implementation": null,
|
48 |
"backbone_cfg": {
|
49 |
"eagle_path": "NVEagle/eagle_er-qwen3_1_7B-Siglip2_400M_stage1_5_128gpu_er_v7_1mlp_nops",
|
50 |
"load_bf16": false,
|
model-00001-of-00004.safetensors → model-00001-of-00003.safetensors
RENAMED
File without changes
|
model-00002-of-00004.safetensors → model-00002-of-00003.safetensors
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:03ba0f11339d5ed24920582781c7352e308eb4eb78067c128bd8516b146656c8
|
3 |
+
size 1996145888
|
model-00003-of-00004.safetensors → model-00003-of-00003.safetensors
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1f572eb204d7afe3ddbfb890ca56eac1a9bafbdce51ed6fd3ba314dc4298d565
|
3 |
+
size 1455454240
|
model-00004-of-00004.safetensors
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:0f2ce816d725c22977fdc0e7e37468c5b8eb7bfb07f8d040e7617c0d1def56cb
|
3 |
-
size 1856960528
|
|
|
|
|
|
|
|
model.safetensors.index.json
CHANGED
The diff for this file is too large to render.
See raw diff
|
|