Synchronizing local compiler cache.
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +46 -0
- neuronxcc-2.14.182.0+a56cbff7/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/0a57352c7fd763b555b2.json +1 -0
- neuronxcc-2.14.182.0+a56cbff7/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/2ef2288f29598787f90a.json +1 -0
- neuronxcc-2.14.182.0+a56cbff7/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/543d5a298da978bf2eea.json +1 -0
- neuronxcc-2.14.182.0+a56cbff7/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/6a2580f82abbca39b7e8.json +1 -0
- neuronxcc-2.14.182.0+a56cbff7/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/75b6ae752be0874692b5.json +1 -0
- neuronxcc-2.14.182.0+a56cbff7/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/7e85d17ae4dd9b3a2d88.json +1 -0
- neuronxcc-2.14.182.0+a56cbff7/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/8b6180d315737ae80d68.json +1 -0
- neuronxcc-2.14.182.0+a56cbff7/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/913714c63b99d90a6ae1.json +1 -0
- neuronxcc-2.14.182.0+a56cbff7/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/a461fa3d6df803f907a6.json +1 -0
- neuronxcc-2.14.182.0+a56cbff7/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/ab331eba159ded1807f7.json +1 -0
- neuronxcc-2.14.182.0+a56cbff7/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/b9955896a71dfc78f28d.json +1 -0
- neuronxcc-2.14.182.0+a56cbff7/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/bf28cc6b9d14110257b6.json +1 -0
- neuronxcc-2.14.182.0+a56cbff7/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/f2c580dbc2713a5d9234.json +1 -0
- neuronxcc-2.14.182.0+a56cbff7/MODULE_0687095f8d3aa3ce12d6+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.182.0+a56cbff7/MODULE_0687095f8d3aa3ce12d6+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.182.0+a56cbff7/MODULE_0687095f8d3aa3ce12d6+2c2d707e/model.neff +3 -0
- neuronxcc-2.14.182.0+a56cbff7/MODULE_0f8217c0f77d3545d502+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.182.0+a56cbff7/MODULE_0f8217c0f77d3545d502+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.182.0+a56cbff7/MODULE_0f8217c0f77d3545d502+2c2d707e/model.neff +3 -0
- neuronxcc-2.14.182.0+a56cbff7/MODULE_17fbd51961c885174794+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.182.0+a56cbff7/MODULE_17fbd51961c885174794+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.182.0+a56cbff7/MODULE_17fbd51961c885174794+2c2d707e/model.neff +3 -0
- neuronxcc-2.14.182.0+a56cbff7/MODULE_1fc52214ed4eaafa2af7+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.182.0+a56cbff7/MODULE_1fc52214ed4eaafa2af7+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.182.0+a56cbff7/MODULE_1fc52214ed4eaafa2af7+2c2d707e/model.neff +3 -0
- neuronxcc-2.14.182.0+a56cbff7/MODULE_25a6a99cc992600183b5+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.182.0+a56cbff7/MODULE_25a6a99cc992600183b5+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.182.0+a56cbff7/MODULE_25a6a99cc992600183b5+2c2d707e/model.neff +3 -0
- neuronxcc-2.14.182.0+a56cbff7/MODULE_2b1d09ca8c5308643fda+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.182.0+a56cbff7/MODULE_2b1d09ca8c5308643fda+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.182.0+a56cbff7/MODULE_2b1d09ca8c5308643fda+2c2d707e/model.neff +3 -0
- neuronxcc-2.14.182.0+a56cbff7/MODULE_2d3672e10ea0b9d9c314+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.182.0+a56cbff7/MODULE_2d3672e10ea0b9d9c314+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.182.0+a56cbff7/MODULE_2d3672e10ea0b9d9c314+2c2d707e/model.neff +3 -0
- neuronxcc-2.14.182.0+a56cbff7/MODULE_2eb386754e54d4bd0df2+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.182.0+a56cbff7/MODULE_2eb386754e54d4bd0df2+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.182.0+a56cbff7/MODULE_2eb386754e54d4bd0df2+2c2d707e/model.neff +3 -0
- neuronxcc-2.14.182.0+a56cbff7/MODULE_3a6b6d9e762081dec573+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.182.0+a56cbff7/MODULE_3a6b6d9e762081dec573+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.182.0+a56cbff7/MODULE_3a6b6d9e762081dec573+2c2d707e/model.neff +3 -0
- neuronxcc-2.14.182.0+a56cbff7/MODULE_3dbfc17c978392dd65eb+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.182.0+a56cbff7/MODULE_3dbfc17c978392dd65eb+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.182.0+a56cbff7/MODULE_3dbfc17c978392dd65eb+2c2d707e/model.neff +3 -0
- neuronxcc-2.14.182.0+a56cbff7/MODULE_428a161fba1e6e515a29+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.182.0+a56cbff7/MODULE_428a161fba1e6e515a29+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.182.0+a56cbff7/MODULE_428a161fba1e6e515a29+2c2d707e/model.neff +3 -0
- neuronxcc-2.14.182.0+a56cbff7/MODULE_4c6bece225fa6802237c+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.182.0+a56cbff7/MODULE_4c6bece225fa6802237c+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.182.0+a56cbff7/MODULE_4c6bece225fa6802237c+2c2d707e/model.neff +3 -0
.gitattributes
CHANGED
@@ -3259,3 +3259,49 @@ neuronxcc-2.13.66.0+6dfecc895/MODULE_291179394533923841+abb26765/model.neff filt
|
|
3259 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_8896680080935756983+abb26765/model.neff filter=lfs diff=lfs merge=lfs -text
|
3260 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_8968847275564604714+abb26765/model.neff filter=lfs diff=lfs merge=lfs -text
|
3261 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_9623917463913047246+abb26765/model.neff filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
3259 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_8896680080935756983+abb26765/model.neff filter=lfs diff=lfs merge=lfs -text
|
3260 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_8968847275564604714+abb26765/model.neff filter=lfs diff=lfs merge=lfs -text
|
3261 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_9623917463913047246+abb26765/model.neff filter=lfs diff=lfs merge=lfs -text
|
3262 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_0687095f8d3aa3ce12d6+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3263 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_0f8217c0f77d3545d502+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3264 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_17fbd51961c885174794+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3265 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_1fc52214ed4eaafa2af7+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3266 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_25a6a99cc992600183b5+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3267 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_2b1d09ca8c5308643fda+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3268 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_2d3672e10ea0b9d9c314+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3269 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_2eb386754e54d4bd0df2+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3270 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_3a6b6d9e762081dec573+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3271 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_3dbfc17c978392dd65eb+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3272 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_428a161fba1e6e515a29+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3273 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_4c6bece225fa6802237c+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3274 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_510d1b3e787db5d64500+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3275 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_53f2b9aee6106a9f4dcd+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3276 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_5eda50b31e5c582e2878+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3277 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_6170b5f2281ca826c2b2+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3278 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_667659b5880c8aa3c228+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3279 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_688776c29ec37ba82856+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3280 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_763de59456afcb367149+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3281 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_7a376947f78404875f58+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3282 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_7cf624dfa838c61f3c6b+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3283 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_7e3464a9e0f1d4136a66+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3284 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_882ba05b08198c8f905e+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3285 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_8fa8787f9d1cb78bf2ca+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3286 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_96197eb9bd55505ed7ef+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3287 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_968bf6eacaf5303d4c8e+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3288 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_97b9e95fa2daba9493e8+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3289 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_9b1aff5346a817ad5d9f+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3290 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_9d1992f0aab64038d9c9+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3291 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_a16cad38f886c688ecef+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3292 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_aa23de623dd5e61f2b48+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3293 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_b62de3426c2cdf3bead4+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3294 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_b99af071064810447719+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3295 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_b9bbef4437ef03c29568+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3296 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_bbc6a6451a22be51978b+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3297 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_bcf852ae9f12d5ae27f8+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3298 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_c1086afddb9cd4007def+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3299 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_cb2eb76a11d88856d152+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3300 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_d2a5e6fd24b065f29396+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3301 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_d3c9c5fa2608e9fa1b87+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3302 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_e4be7b4851b279b21c24+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3303 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_e774925ef02cac9260be+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3304 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_e9cd7823552b4052fd1f+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3305 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_f06eb185da899bd94560+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3306 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_f5782d94847d0a80b7d3+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3307 |
+
neuronxcc-2.14.182.0+a56cbff7/MODULE_fdf13076ef71fca7878d+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
neuronxcc-2.14.182.0+a56cbff7/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/0a57352c7fd763b555b2.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 11008, "max_position_embeddings": 4096, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 24, "checkpoint_id": "meta-llama/Llama-2-7b-chat-hf", "checkpoint_revision": "f5db02db724555f92da89c216ac04704f23d4590", "compiler_type": "neuronx-cc", "compiler_version": "2.14.182.0+a56cbff7", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 32, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.14.182.0+a56cbff7/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/2ef2288f29598787f90a.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 11008, "max_position_embeddings": 4096, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 16, "checkpoint_id": "meta-llama/Llama-2-7b-chat-hf", "checkpoint_revision": "f5db02db724555f92da89c216ac04704f23d4590", "compiler_type": "neuronx-cc", "compiler_version": "2.14.182.0+a56cbff7", "num_cores": 12, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 32, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.14.182.0+a56cbff7/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/543d5a298da978bf2eea.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 11008, "max_position_embeddings": 4096, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 1, "checkpoint_id": "meta-llama/Llama-2-7b-chat-hf", "checkpoint_revision": "f5db02db724555f92da89c216ac04704f23d4590", "compiler_type": "neuronx-cc", "compiler_version": "2.14.182.0+a56cbff7", "num_cores": 12, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 32, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.14.182.0+a56cbff7/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/6a2580f82abbca39b7e8.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 11008, "max_position_embeddings": 4096, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 32, "checkpoint_id": "meta-llama/Llama-2-7b-chat-hf", "checkpoint_revision": "f5db02db724555f92da89c216ac04704f23d4590", "compiler_type": "neuronx-cc", "compiler_version": "2.14.182.0+a56cbff7", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 32, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.14.182.0+a56cbff7/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/75b6ae752be0874692b5.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 11008, "max_position_embeddings": 4096, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 24, "checkpoint_id": "meta-llama/Llama-2-7b-chat-hf", "checkpoint_revision": "f5db02db724555f92da89c216ac04704f23d4590", "compiler_type": "neuronx-cc", "compiler_version": "2.14.182.0+a56cbff7", "num_cores": 12, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 32, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.14.182.0+a56cbff7/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/7e85d17ae4dd9b3a2d88.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 11008, "max_position_embeddings": 4096, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 30, "checkpoint_id": "meta-llama/Llama-2-7b-chat-hf", "checkpoint_revision": "f5db02db724555f92da89c216ac04704f23d4590", "compiler_type": "neuronx-cc", "compiler_version": "2.14.182.0+a56cbff7", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 32, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.14.182.0+a56cbff7/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/8b6180d315737ae80d68.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 11008, "max_position_embeddings": 4096, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 16, "checkpoint_id": "meta-llama/Llama-2-7b-chat-hf", "checkpoint_revision": "f5db02db724555f92da89c216ac04704f23d4590", "compiler_type": "neuronx-cc", "compiler_version": "2.14.182.0+a56cbff7", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 32, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.14.182.0+a56cbff7/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/913714c63b99d90a6ae1.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 11008, "max_position_embeddings": 4096, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 4, "checkpoint_id": "meta-llama/Llama-2-7b-chat-hf", "checkpoint_revision": "f5db02db724555f92da89c216ac04704f23d4590", "compiler_type": "neuronx-cc", "compiler_version": "2.14.182.0+a56cbff7", "num_cores": 12, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 32, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.14.182.0+a56cbff7/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/a461fa3d6df803f907a6.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 11008, "max_position_embeddings": 4096, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 4, "checkpoint_id": "meta-llama/Llama-2-7b-chat-hf", "checkpoint_revision": "f5db02db724555f92da89c216ac04704f23d4590", "compiler_type": "neuronx-cc", "compiler_version": "2.14.182.0+a56cbff7", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 32, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.14.182.0+a56cbff7/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/ab331eba159ded1807f7.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 11008, "max_position_embeddings": 4096, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 8, "checkpoint_id": "meta-llama/Llama-2-7b-chat-hf", "checkpoint_revision": "f5db02db724555f92da89c216ac04704f23d4590", "compiler_type": "neuronx-cc", "compiler_version": "2.14.182.0+a56cbff7", "num_cores": 12, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 32, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.14.182.0+a56cbff7/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/b9955896a71dfc78f28d.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 11008, "max_position_embeddings": 4096, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 8, "checkpoint_id": "meta-llama/Llama-2-7b-chat-hf", "checkpoint_revision": "f5db02db724555f92da89c216ac04704f23d4590", "compiler_type": "neuronx-cc", "compiler_version": "2.14.182.0+a56cbff7", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 32, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.14.182.0+a56cbff7/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/bf28cc6b9d14110257b6.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 11008, "max_position_embeddings": 4096, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 1, "checkpoint_id": "meta-llama/Llama-2-7b-chat-hf", "checkpoint_revision": "f5db02db724555f92da89c216ac04704f23d4590", "compiler_type": "neuronx-cc", "compiler_version": "2.14.182.0+a56cbff7", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 32, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.14.182.0+a56cbff7/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/f2c580dbc2713a5d9234.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 11008, "max_position_embeddings": 4096, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 48, "checkpoint_id": "meta-llama/Llama-2-7b-chat-hf", "checkpoint_revision": "f5db02db724555f92da89c216ac04704f23d4590", "compiler_type": "neuronx-cc", "compiler_version": "2.14.182.0+a56cbff7", "num_cores": 12, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 32, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.14.182.0+a56cbff7/MODULE_0687095f8d3aa3ce12d6+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.182.0+a56cbff7/MODULE_0687095f8d3aa3ce12d6+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f1566e2a8f5b730de18b31d6d8d7c7c419cada8646df6cdc8cc6005fc2a186d3
|
3 |
+
size 310640
|
neuronxcc-2.14.182.0+a56cbff7/MODULE_0687095f8d3aa3ce12d6+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea92cac7ab1c517d5daf84b871358b2edbf3c6d2fca7982a32a5296b8285b197
|
3 |
+
size 2253824
|
neuronxcc-2.14.182.0+a56cbff7/MODULE_0f8217c0f77d3545d502+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.182.0+a56cbff7/MODULE_0f8217c0f77d3545d502+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d2c7c74a97521977d7544dcae68780c86710b471b75a7727dc6e3804425b245d
|
3 |
+
size 499775
|
neuronxcc-2.14.182.0+a56cbff7/MODULE_0f8217c0f77d3545d502+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5339e95375d6b462904e4aa55975deab7a212a0608aad243e69fdaa3dd855637
|
3 |
+
size 31540224
|
neuronxcc-2.14.182.0+a56cbff7/MODULE_17fbd51961c885174794+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.182.0+a56cbff7/MODULE_17fbd51961c885174794+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:85f62f3312bb3b755f884a1668727749d3edb7c62f5590aa3b004172869bc5b6
|
3 |
+
size 310896
|
neuronxcc-2.14.182.0+a56cbff7/MODULE_17fbd51961c885174794+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a8668be9d590a9d2a55047b41a21999695397d9e923ac2aaa3471bfd500d3e7b
|
3 |
+
size 1803264
|
neuronxcc-2.14.182.0+a56cbff7/MODULE_1fc52214ed4eaafa2af7+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.182.0+a56cbff7/MODULE_1fc52214ed4eaafa2af7+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:24b359f3a640fad8eb963b7fe1d12dbe1380b0bfd3a56e3ac07119c4d217d779
|
3 |
+
size 310896
|
neuronxcc-2.14.182.0+a56cbff7/MODULE_1fc52214ed4eaafa2af7+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aded78a224bafc3dc2856309060b388f04e766fe9b0dd310b309bf9e1803b97
|
3 |
+
size 1854464
|
neuronxcc-2.14.182.0+a56cbff7/MODULE_25a6a99cc992600183b5+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.182.0+a56cbff7/MODULE_25a6a99cc992600183b5+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:24dac2e5442b3b3a4a7b785e652fa0ecfc8f4d370a56a0f3809651dcc4825474
|
3 |
+
size 399042
|
neuronxcc-2.14.182.0+a56cbff7/MODULE_25a6a99cc992600183b5+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8bf991c2097a0abc00903d5e2bb43a6b0e3f528f3a53c737f0ca68d4860e8cea
|
3 |
+
size 13159424
|
neuronxcc-2.14.182.0+a56cbff7/MODULE_2b1d09ca8c5308643fda+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.182.0+a56cbff7/MODULE_2b1d09ca8c5308643fda+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:baa9b0014881a072b233e59c5afbde2120344a511174871b1f69394a80e8a2e3
|
3 |
+
size 316897
|
neuronxcc-2.14.182.0+a56cbff7/MODULE_2b1d09ca8c5308643fda+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d8a0bd7ca3345e013a7daae38a1a52b812c7daf2e04d7c8e54b896829ef2ae28
|
3 |
+
size 2305024
|
neuronxcc-2.14.182.0+a56cbff7/MODULE_2d3672e10ea0b9d9c314+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.182.0+a56cbff7/MODULE_2d3672e10ea0b9d9c314+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:926c3024190b4c30509cf9806c8ea3b153a9dc78ed5ba1dec2a6c859a8bd43fc
|
3 |
+
size 499775
|
neuronxcc-2.14.182.0+a56cbff7/MODULE_2d3672e10ea0b9d9c314+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6980ca6fff904b34a1f3f1a4100f37ecc79a1463066b9c93e8e6cd492eaf1255
|
3 |
+
size 31540224
|
neuronxcc-2.14.182.0+a56cbff7/MODULE_2eb386754e54d4bd0df2+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.182.0+a56cbff7/MODULE_2eb386754e54d4bd0df2+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b6cb6ebdf0a6be648ca94f9bf518b59169aaaaa328a32295a74c3db8b0ca2088
|
3 |
+
size 312642
|
neuronxcc-2.14.182.0+a56cbff7/MODULE_2eb386754e54d4bd0df2+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dcbed442c9eb1e5f33a97e2cf9f2ea2d08e501ea87c4ec9355a0671b56131513
|
3 |
+
size 2806784
|
neuronxcc-2.14.182.0+a56cbff7/MODULE_3a6b6d9e762081dec573+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.182.0+a56cbff7/MODULE_3a6b6d9e762081dec573+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:102e7a2491f09e10ef994632cf15fb427df7abad5957822356aa76eae8b55cab
|
3 |
+
size 399298
|
neuronxcc-2.14.182.0+a56cbff7/MODULE_3a6b6d9e762081dec573+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2feb5d4a3efd90159fae8c389d92984344d15d4d7b96b59cea0db1a77e298f05
|
3 |
+
size 3625984
|
neuronxcc-2.14.182.0+a56cbff7/MODULE_3dbfc17c978392dd65eb+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.182.0+a56cbff7/MODULE_3dbfc17c978392dd65eb+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d928706f3b1ec7e521cae55f5911eb92fc44f684cff4bf6a3ba7dbcf5b4e3dff
|
3 |
+
size 399042
|
neuronxcc-2.14.182.0+a56cbff7/MODULE_3dbfc17c978392dd65eb+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d88ebd1aab7f1f27e575d58d436cfc0f6cef09a22ef82862816163d1eecd2020
|
3 |
+
size 4199424
|
neuronxcc-2.14.182.0+a56cbff7/MODULE_428a161fba1e6e515a29+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.182.0+a56cbff7/MODULE_428a161fba1e6e515a29+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e1de16bf061ebedea621de088148b64b0fb34bb1cb05a14840d02b36a264f5e1
|
3 |
+
size 310640
|
neuronxcc-2.14.182.0+a56cbff7/MODULE_428a161fba1e6e515a29+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:240cc11a83015d2dbb922b1f8c7282e3ed7d5ea7cc2a5e165c8979157da0bbae
|
3 |
+
size 2335744
|
neuronxcc-2.14.182.0+a56cbff7/MODULE_4c6bece225fa6802237c+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.182.0+a56cbff7/MODULE_4c6bece225fa6802237c+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a46325e72cb58c370e3a948fda2c775a97147a05d05806f6e16b3ba38eb472eb
|
3 |
+
size 500031
|
neuronxcc-2.14.182.0+a56cbff7/MODULE_4c6bece225fa6802237c+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8a069236467e98b9149c6766d389cd49f1634ae4e70ba6149df4fa7a1f922c6a
|
3 |
+
size 26287104
|