AlfredXu2 committed on
Commit
a329e7e
·
1 Parent(s): b2d3dba

add_npu_spec

Browse files
Files changed (1) hide show
  1. config.json +5 -1
config.json CHANGED
@@ -35,5 +35,9 @@
35
  "torch_dtype": "bfloat16",
36
  "transformers_version": "4.45.0.dev0",
37
  "use_cache": true,
38
- "vocab_size": 128256
 
 
 
 
39
  }
 
35
  "torch_dtype": "bfloat16",
36
  "transformers_version": "4.45.0.dev0",
37
  "use_cache": true,
38
+ "vocab_size": 128256,
39
+ "layer_bin_name": "llama_1b.xclbin",
40
+ "lm_head_bin_name": "lm_head_1b.xclbin",
41
+ "addr_qk": 5120,
42
+ "addr_kv": 33792
43
  }