dacorvo HF Staff committed on
Commit
67c1b1c
·
verified ·
1 Parent(s): 9530eb1

Synchronizing local compiler cache.

Browse files
.gitattributes CHANGED
@@ -2135,3 +2135,5 @@ neuronxcc-2.16.372.0+4a9b2326/MODULE_f7a493b3a1ae24ab8ebb+613edded/model.neff fi
2135
  neuronxcc-2.16.372.0+4a9b2326/MODULE_fa8e5e93b134884838d5+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
2136
  neuronxcc-2.16.372.0+4a9b2326/MODULE_fadc62f786e9e6e1bf75+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
2137
  neuronxcc-2.16.372.0+4a9b2326/MODULE_fce469267b2ad1b5d80e+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
 
 
 
2135
  neuronxcc-2.16.372.0+4a9b2326/MODULE_fa8e5e93b134884838d5+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
2136
  neuronxcc-2.16.372.0+4a9b2326/MODULE_fadc62f786e9e6e1bf75+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
2137
  neuronxcc-2.16.372.0+4a9b2326/MODULE_fce469267b2ad1b5d80e+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
2138
+ neuronxcc-2.16.372.0+4a9b2326/MODULE_8ea2de719456a80196f9+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
2139
+ neuronxcc-2.16.372.0+4a9b2326/MODULE_c064389074584e41f54f+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.2.0.dev1/inference/phi3/microsoft/Phi-3-mini-4k-instruct/352a3518452cfb4a7d84.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"architectures": ["Phi3ForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "auto_map": {"AutoConfig": "microsoft/Phi-3-mini-4k-instruct--configuration_phi3.Phi3Config", "AutoModelForCausalLM": "microsoft/Phi-3-mini-4k-instruct--modeling_phi3.Phi3ForCausalLM"}, "bos_token_id": 1, "embd_pdrop": 0.0, "eos_token_id": 32000, "hidden_act": "silu", "hidden_size": 3072, "initializer_range": 0.02, "intermediate_size": 8192, "max_position_embeddings": 4096, "model_type": "phi3", "neuron": {"auto_cast_type": "bf16", "batch_size": 2, "checkpoint_id": "microsoft/Phi-3-mini-4k-instruct", "checkpoint_revision": "0a67737cc96d2554230f90338b163bc6380a2a85", "compiler_type": "neuronx-cc", "compiler_version": "2.16.372.0+4a9b2326", "num_cores": 2, "sequence_length": 1024}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 32, "original_max_position_embeddings": 4096, "pad_token_id": 32000, "partial_rotary_factor": 1.0, "resid_pdrop": 0.0, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "sliding_window": 2047, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 32064}
neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.2.0.dev1/inference/qwen2/Qwen/Qwen2.5-0.5B/eb9dc14053f0f9d06257.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"architectures": ["Qwen2ForCausalLM"], "attention_dropout": 0.0, "bos_token_id": 151643, "eos_token_id": 151643, "hidden_act": "silu", "hidden_size": 896, "initializer_range": 0.02, "intermediate_size": 4864, "max_position_embeddings": 32768, "max_window_layers": 24, "model_type": "qwen2", "neuron": {"auto_cast_type": "fp16", "batch_size": 4, "checkpoint_id": "Qwen/Qwen2.5-0.5B", "checkpoint_revision": "060db6499f32faf8b98477b0a26969ef7d8b9987", "compiler_type": "neuronx-cc", "compiler_version": "2.16.372.0+4a9b2326", "num_cores": 2, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 14, "num_hidden_layers": 24, "num_key_value_heads": 2, "rms_norm_eps": 1e-06, "rope_scaling": null, "rope_theta": 1000000.0, "sliding_window": 32768, "tie_word_embeddings": true, "torch_dtype": "bfloat16", "use_cache": true, "use_mrope": false, "use_sliding_window": false, "vocab_size": 151936}
neuronxcc-2.16.372.0+4a9b2326/MODULE_8ea2de719456a80196f9+613edded/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"]
neuronxcc-2.16.372.0+4a9b2326/MODULE_8ea2de719456a80196f9+613edded/model.done ADDED
File without changes
neuronxcc-2.16.372.0+4a9b2326/MODULE_8ea2de719456a80196f9+613edded/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70a8802543e684578f4d74b3e24556882cbf885c69c59a1f9523d4fbf3b85d2f
3
+ size 337934
neuronxcc-2.16.372.0+4a9b2326/MODULE_8ea2de719456a80196f9+613edded/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce1e673f3967763de9247527e702341604f8981d6bdd01d1bdb08b295bbf2ff8
3
+ size 5592064
neuronxcc-2.16.372.0+4a9b2326/MODULE_c064389074584e41f54f+613edded/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"]
neuronxcc-2.16.372.0+4a9b2326/MODULE_c064389074584e41f54f+613edded/model.done ADDED
File without changes
neuronxcc-2.16.372.0+4a9b2326/MODULE_c064389074584e41f54f+613edded/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40df50a6395a19aaa93b9248a0ffad5d24f388cd8b6cd521a74110ee171df42f
3
+ size 288747
neuronxcc-2.16.372.0+4a9b2326/MODULE_c064389074584e41f54f+613edded/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0bfeffa62d32ca60e279d6564128bfda0868b442506593eb3349fea571519f91
3
+ size 14418944