AlfredXu2 committed on
Commit
8ea4f54
·
1 Parent(s): 1555d8d
Files changed (4) hide show
  1. .gitattributes +2 -0
  2. config.json +3 -1
  3. layer.xclbin +3 -0
  4. lm_head.xclbin +3 -0
.gitattributes CHANGED
@@ -1,2 +1,4 @@
1
  tokenizer.json filter=lfs diff=lfs merge=lfs -text
2
  model.q4nx filter=lfs diff=lfs merge=lfs -text
 
 
 
1
  tokenizer.json filter=lfs diff=lfs merge=lfs -text
2
  model.q4nx filter=lfs diff=lfs merge=lfs -text
3
+ layer.xclbin filter=lfs diff=lfs merge=lfs -text
4
+ lm_head.xclbin filter=lfs diff=lfs merge=lfs -text
config.json CHANGED
@@ -35,5 +35,7 @@
35
  "torch_dtype": "float32",
36
  "transformers_version": "4.52.0.dev0",
37
  "use_cache": true,
38
- "vocab_size": 128256
 
 
39
  }
 
35
  "torch_dtype": "float32",
36
  "transformers_version": "4.52.0.dev0",
37
  "use_cache": true,
38
+ "vocab_size": 128256,
39
+ "addr_qk": 9216,
40
+ "addr_kv": 34304
41
  }
layer.xclbin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d33bb9549061937d2b5ecadec22b6ee257500edb6c4b6980890a0e36d19e9ed7
3
+ size 331003
lm_head.xclbin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:28b4bab3cc798c0ce0d149be30b5495ec79bee5e711614c4770b71445917c2bd
3
+ size 152843