Synchronizing local compiler cache.
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +60 -0
- neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-13b-chat-hf/1ab4fec65fe40b15d8fc.json +1 -0
- neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/0c05f781075e377b3fe0.json +1 -0
- neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/5a8294b279e725cf8542.json +1 -0
- neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/735e2b4b3a5019f203a7.json +1 -0
- neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/b4d9aa50677e27d82b4f.json +1 -0
- neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/b57ff0785cfe94aa0718.json +1 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_030e33ef5cbb962feaff+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_030e33ef5cbb962feaff+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_030e33ef5cbb962feaff+2c2d707e/model.neff +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_080e84736415daff8ec2+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_080e84736415daff8ec2+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_080e84736415daff8ec2+2c2d707e/model.neff +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_0a5bc51ecf53ae664481+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_0a5bc51ecf53ae664481+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_0a5bc51ecf53ae664481+2c2d707e/model.neff +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_0b46584d966f73defc7f+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_0b46584d966f73defc7f+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_0b46584d966f73defc7f+2c2d707e/model.neff +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_10b9bdbf2c308ea5cfd6+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_10b9bdbf2c308ea5cfd6+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_10b9bdbf2c308ea5cfd6+2c2d707e/model.neff +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_191faaea815817f18cbc+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_191faaea815817f18cbc+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_191faaea815817f18cbc+2c2d707e/model.neff +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_20ae17db0c2c9f8459be+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_20ae17db0c2c9f8459be+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_20ae17db0c2c9f8459be+2c2d707e/model.neff +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_2ab662af1ee4f42104cc+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_2ab662af1ee4f42104cc+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_2ab662af1ee4f42104cc+2c2d707e/model.neff +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_3b0708cd079253ab7760+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_3b0708cd079253ab7760+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_3b0708cd079253ab7760+2c2d707e/model.neff +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_3f04dbee4ab2e153e3c7+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_3f04dbee4ab2e153e3c7+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_3f04dbee4ab2e153e3c7+2c2d707e/model.neff +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_3f669e736d8907cd1111+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_3f669e736d8907cd1111+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_3f669e736d8907cd1111+2c2d707e/model.neff +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_442eda90da2cf2f72c01+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_442eda90da2cf2f72c01+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_442eda90da2cf2f72c01+2c2d707e/model.neff +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_443c7de81db84f0f078c+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_443c7de81db84f0f078c+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_443c7de81db84f0f078c+2c2d707e/model.hlo_module.pb.lock +0 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_475f0e6eb6f4502b945e+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_475f0e6eb6f4502b945e+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_475f0e6eb6f4502b945e+2c2d707e/model.neff +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_486c7a82a8c022dff09d+2c2d707e/compile_flags.txt +1 -0
.gitattributes
CHANGED
@@ -2443,3 +2443,63 @@ neuronxcc-2.13.68.0+6dfecc895/MODULE_8451101906021534154+55d6a20f/model.neff fil
|
|
2443 |
neuronxcc-2.13.68.0+6dfecc895/MODULE_913272093888285008+55d6a20f/model.neff filter=lfs diff=lfs merge=lfs -text
|
2444 |
neuronxcc-2.13.68.0+6dfecc895/MODULE_9613391693182017117+55d6a20f/model.neff filter=lfs diff=lfs merge=lfs -text
|
2445 |
neuronxcc-2.13.68.0+6dfecc895/MODULE_9985841552596062342+55d6a20f/model.neff filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
2443 |
neuronxcc-2.13.68.0+6dfecc895/MODULE_913272093888285008+55d6a20f/model.neff filter=lfs diff=lfs merge=lfs -text
|
2444 |
neuronxcc-2.13.68.0+6dfecc895/MODULE_9613391693182017117+55d6a20f/model.neff filter=lfs diff=lfs merge=lfs -text
|
2445 |
neuronxcc-2.13.68.0+6dfecc895/MODULE_9985841552596062342+55d6a20f/model.neff filter=lfs diff=lfs merge=lfs -text
|
2446 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_030e33ef5cbb962feaff+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2447 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_080e84736415daff8ec2+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2448 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_0a5bc51ecf53ae664481+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2449 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_0b46584d966f73defc7f+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2450 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_10b9bdbf2c308ea5cfd6+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2451 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_191faaea815817f18cbc+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2452 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_20ae17db0c2c9f8459be+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2453 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_2ab662af1ee4f42104cc+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2454 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_3b0708cd079253ab7760+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2455 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_3f04dbee4ab2e153e3c7+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2456 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_3f669e736d8907cd1111+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2457 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_442eda90da2cf2f72c01+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2458 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_475f0e6eb6f4502b945e+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2459 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_486c7a82a8c022dff09d+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2460 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_51e280213d3349f527d2+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2461 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_549172aa834892c7c7a4+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2462 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_566eabca608aba464c36+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2463 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_5874976226b548eb5371+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2464 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_6448de0d7cf065f478d5+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2465 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_6894a3560ccb6b65e95d+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2466 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_6ae1c452ac1fdada3eb2+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2467 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_6d21ace3022d34ab3830+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2468 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_6e01e37e53f41097b6b6+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2469 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_76f7d0b68aec3cb69d0a+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2470 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_78d21abaf2f2d060b22b+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2471 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_7c1bb27bab9691eba531+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2472 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_7e2b745e708288a40519+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2473 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_7f81455f54f39113fb16+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2474 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_83df5e0a8e20244654ed+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2475 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_856f02167205261ff8fc+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2476 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_86cf0513653fad241ec3+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2477 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_89f4ef99a1b9dc2e0376+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2478 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_8b5c27e70924272ec512+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2479 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_8e207a20e91d1dbf8a00+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2480 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_8ffe5fc009f227ac2503+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2481 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_92a4f58f6236c561796c+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2482 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_980f9018dc8fd109bdd2+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2483 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_a2682791cd350ba7a9fe+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2484 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_a48e6804bafaa4e7ae79+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2485 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_a75a2029ddf30ccd71c0+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2486 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_ae8b47db3e76c14c631a+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2487 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_af2d0d551946d2440394+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2488 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_afc09ba31e52cb79957b+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2489 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_b2ff93897da9ae5d4230+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2490 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_bcd19bc67db1b3ff4381+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2491 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_c20d4048148f74bd831e+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2492 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_c42d9fbc62e7ab02b883+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2493 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_c51d71779e7baf780bdd+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2494 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_ce35a7f50500ae68dabb+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2495 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_daf677f1de2932b06dee+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2496 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_e0428cac0a05340dd6b6+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2497 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_e0aea0f1fae7e8ea75a8+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2498 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_e662eba2c35ccc6d0e75+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2499 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_e6eefadafc00e030357f+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2500 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_e8eb76aadbf870ef66cb+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2501 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_e927a8c1d5e1e8ef193c+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2502 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_ea3dcabd6c9634a1604e+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2503 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_eb62436c86a87d12aabf+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2504 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_eeb5873dd3e715b2c510+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2505 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_fba6a92254966a90eb3b+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-13b-chat-hf/1ab4fec65fe40b15d8fc.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 5120, "initializer_range": 0.02, "intermediate_size": 13824, "max_position_embeddings": 4096, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 1, "checkpoint_id": "meta-llama/Llama-2-13b-chat-hf", "checkpoint_revision": "a2cb7a712bb6e5e736ca7f8cd98167f81a0b5bd8", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 24, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 40, "num_hidden_layers": 40, "num_key_value_heads": 40, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/0c05f781075e377b3fe0.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 11008, "max_position_embeddings": 4096, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 32, "checkpoint_id": "meta-llama/Llama-2-7b-chat-hf", "checkpoint_revision": "f5db02db724555f92da89c216ac04704f23d4590", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 24, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 32, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/5a8294b279e725cf8542.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 11008, "max_position_embeddings": 4096, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 4, "checkpoint_id": "meta-llama/Llama-2-7b-chat-hf", "checkpoint_revision": "f5db02db724555f92da89c216ac04704f23d4590", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 24, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 32, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/735e2b4b3a5019f203a7.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 11008, "max_position_embeddings": 4096, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 1, "checkpoint_id": "meta-llama/Llama-2-7b-chat-hf", "checkpoint_revision": "f5db02db724555f92da89c216ac04704f23d4590", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 24, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 32, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/b4d9aa50677e27d82b4f.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 11008, "max_position_embeddings": 4096, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 8, "checkpoint_id": "meta-llama/Llama-2-7b-chat-hf", "checkpoint_revision": "f5db02db724555f92da89c216ac04704f23d4590", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 24, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 32, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/b57ff0785cfe94aa0718.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 11008, "max_position_embeddings": 4096, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 16, "checkpoint_id": "meta-llama/Llama-2-7b-chat-hf", "checkpoint_revision": "f5db02db724555f92da89c216ac04704f23d4590", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 24, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 32, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_030e33ef5cbb962feaff+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_030e33ef5cbb962feaff+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:651742271c27e3721a66cc72c7e9f11b12d1f799e617d176f79559662ea26578
|
3 |
+
size 371259
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_030e33ef5cbb962feaff+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:28902f1884a5e127068e71762a083ded1a9b0e1c039d29daf6f67a12249dc8de
|
3 |
+
size 7353344
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_080e84736415daff8ec2+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_080e84736415daff8ec2+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:16459fcc2a1c86cfba250d4901050bb6648787e6f805b0edf061ecdf5f124463
|
3 |
+
size 300634
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_080e84736415daff8ec2+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:71dd89cc6d4fc63b390e068500d43163378c930697cc757160d9d68d01749dbe
|
3 |
+
size 1291264
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_0a5bc51ecf53ae664481+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_0a5bc51ecf53ae664481+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd505c607de6390cf3b8a126862c083a8ab007cb2cd942883299a76698f21283
|
3 |
+
size 336719
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_0a5bc51ecf53ae664481+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67a5cb0d1c5e44158ff65c346f6e9657115351c0859ac4dbca2e87ff5789bd2e
|
3 |
+
size 17193984
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_0b46584d966f73defc7f+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_0b46584d966f73defc7f+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fba8fb4e8c72e2af5f03448185330da0aa7aca9e6f20b7617e4c93ac5492552d
|
3 |
+
size 421309
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_0b46584d966f73defc7f+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c8af71b6dc042988b40ca6ddebc2410af56126f066596c2e5f88b135e8889b0
|
3 |
+
size 4168704
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_10b9bdbf2c308ea5cfd6+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_10b9bdbf2c308ea5cfd6+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ebd445c9b66fb6771ce2929e49c0b80c8e9a91bd6a5ddef299c6e38181964919
|
3 |
+
size 381723
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_10b9bdbf2c308ea5cfd6+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:90e28054c756f72ab289e264aae6a45a821be574fe2daf0ea67b5ceae4565b63
|
3 |
+
size 4066304
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_191faaea815817f18cbc+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_191faaea815817f18cbc+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4531ba09afd7b78594a1b6b09ef336c3df931a865d4cba61f45c1e41ddc7a4bb
|
3 |
+
size 397595
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_191faaea815817f18cbc+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:284786819c30e41cdaa6b28f461ecb9736f976229fa94c75d58d332d9a006fc8
|
3 |
+
size 4086784
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_20ae17db0c2c9f8459be+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_20ae17db0c2c9f8459be+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daf70394505c59e0fce89e72a2ce531800e8e4fb09a75bf7767b65c339d7ded5
|
3 |
+
size 397595
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_20ae17db0c2c9f8459be+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b02e645ad56d26eb467ad56a81356e9dad0ff220797971cec312ecd621321565
|
3 |
+
size 6247424
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_2ab662af1ee4f42104cc+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_2ab662af1ee4f42104cc+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:82a0ee7d4822263ee7b716c4adc4ecb394c1189f462d07f3104b4e1522b2dfd8
|
3 |
+
size 375515
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_2ab662af1ee4f42104cc+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3bfe2169e8aa30a6cad515c85cecb082d98a154a49866ec556662adf6bffec53
|
3 |
+
size 1967104
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_3b0708cd079253ab7760+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_3b0708cd079253ab7760+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fd364110d3886e0ee0a96d5bf7c6315a629aacffed12fcdf49a5611109df22fa
|
3 |
+
size 375515
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_3b0708cd079253ab7760+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:41e4d53f580bf954ec3835e0102df1b3b6140ac7a95f7aac83eeeae8e9961df5
|
3 |
+
size 1895424
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_3f04dbee4ab2e153e3c7+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_3f04dbee4ab2e153e3c7+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:65ba00c294bb39f12971dc364afe7adb479f5d7b3155fb9ce12949fcc1de962a
|
3 |
+
size 336719
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_3f04dbee4ab2e153e3c7+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:39b99e0169b8df8041ca7403ad61a45fb524770c0ed4b797c9b41f78cae86024
|
3 |
+
size 17193984
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_3f669e736d8907cd1111+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_3f669e736d8907cd1111+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:51aaf988d2296218e4993687fca20634758e320651a2838a4b4bddcc25b8879f
|
3 |
+
size 300634
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_3f669e736d8907cd1111+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f707013a5b511194428339464a9f4092adb07ed998869adf358a75c67d6a526a
|
3 |
+
size 1373184
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_442eda90da2cf2f72c01+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_442eda90da2cf2f72c01+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:14820a0d9f6a075345f2c00e1b702e4d78ece4357ebebddf7d65447b4a9b3915
|
3 |
+
size 421309
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_442eda90da2cf2f72c01+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:071268e1d3d477c67089f35bd64635b543fd2ce8dedd6fcc3efce250fcdcc76a
|
3 |
+
size 4189184
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_443c7de81db84f0f078c+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_443c7de81db84f0f078c+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bc6b6b5c6cf5a5d3fd013c6a44fce319e59cc1f578131d7e936bf85773bca1b7
|
3 |
+
size 420713
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_443c7de81db84f0f078c+2c2d707e/model.hlo_module.pb.lock
ADDED
File without changes
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_475f0e6eb6f4502b945e+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_475f0e6eb6f4502b945e+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0b543db457fa31e31d199a4ccf7987575d7932894e008ea208153eaa2414e119
|
3 |
+
size 344207
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_475f0e6eb6f4502b945e+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9ba46b1e3bab88ac5bbeb8f40a91585ca81ca93399bdc1c0a3c8fdb0a2a9e8b8
|
3 |
+
size 30096384
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_486c7a82a8c022dff09d+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|