Synchronizing local compiler cache.
Browse files- neuronxcc-2.14.213.0+013d129b/0_REGISTRY/0.0.24.dev0/inference/gpt2/hf-internal-testing/tiny-random-gpt2/637e4d9b46a55a4bd378.json +1 -0
- neuronxcc-2.14.213.0+013d129b/0_REGISTRY/0.0.24.dev0/inference/mixtral/dacorvo/Mixtral-tiny/f8481d38d5385e766e16.json +1 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_155a5e57960474557323+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_155a5e57960474557323+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_155a5e57960474557323+2c2d707e/model.neff +0 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_76901e390efc58ac4dd9+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_76901e390efc58ac4dd9+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_76901e390efc58ac4dd9+2c2d707e/model.neff +0 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_dce0056010051b49469f+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_dce0056010051b49469f+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_dce0056010051b49469f+2c2d707e/model.neff +0 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_e75ea02f5df3e2da3d47+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_e75ea02f5df3e2da3d47+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_e75ea02f5df3e2da3d47+2c2d707e/model.neff +0 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_faa46569f7ab44a3175c+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_faa46569f7ab44a3175c+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_faa46569f7ab44a3175c+2c2d707e/model.neff +0 -0
neuronxcc-2.14.213.0+013d129b/0_REGISTRY/0.0.24.dev0/inference/gpt2/hf-internal-testing/tiny-random-gpt2/637e4d9b46a55a4bd378.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"activation_function": "gelu_new", "attention_probs_dropout_prob": 0.1, "attn_pdrop": 0.1, "bos_token_id": 98, "embd_pdrop": 0.1, "eos_token_id": 98, "gradient_checkpointing": false, "hidden_act": "gelu", "hidden_dropout_prob": 0.1, "initializer_range": 0.02, "intermediate_size": 37, "layer_norm_epsilon": 1e-05, "model_type": "gpt2", "n_ctx": 512, "n_embd": 32, "n_head": 4, "n_inner": null, "n_layer": 5, "n_positions": 512, "neuron": {"auto_cast_type": "fp32", "batch_size": 1, "checkpoint_id": "hf-internal-testing/tiny-random-gpt2", "checkpoint_revision": "71034c5d8bde858ff824298bdedc65515b97d2b9", "compiler_type": "neuronx-cc", "compiler_version": "2.14.213.0+013d129b", "num_cores": 24, "sequence_length": 512, "task": "text-generation"}, "pad_token_id": 98, "reorder_and_upcast_attn": false, "resid_pdrop": 0.1, "scale_attn_by_inverse_layer_idx": false, "scale_attn_weights": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "summary_type": "cls_index", "summary_use_proj": true, "type_vocab_size": 16, "use_cache": true, "vocab_size": 1000}
|
neuronxcc-2.14.213.0+013d129b/0_REGISTRY/0.0.24.dev0/inference/mixtral/dacorvo/Mixtral-tiny/f8481d38d5385e766e16.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["MixtralForCausalLM"], "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 1024, "initializer_range": 0.02, "intermediate_size": 3584, "max_position_embeddings": 1024, "model_type": "mixtral", "neuron": {"auto_cast_type": "fp16", "batch_size": 4, "checkpoint_id": "dacorvo/Mixtral-tiny", "checkpoint_revision": "c557ba205ddff6ea911f4719e0d543d6c08356b6", "compiler_type": "neuronx-cc", "compiler_version": "2.14.213.0+013d129b", "num_cores": 2, "sequence_length": 1024, "task": "text-generation"}, "num_attention_heads": 32, "num_experts_per_tok": 2, "num_hidden_layers": 2, "num_key_value_heads": 8, "num_local_experts": 8, "output_router_logits": false, "rms_norm_eps": 1e-05, "rope_theta": 10000.0, "router_aux_loss_coef": 0.001, "router_jitter_noise": 0.0, "sliding_window": 4096, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.14.213.0+013d129b/MODULE_155a5e57960474557323+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.213.0+013d129b/MODULE_155a5e57960474557323+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7d2b7cfc39de1bbc0693534e4faba59fe43ff37fd76c9f9687e84b9695c6bdda
|
3 |
+
size 56790
|
neuronxcc-2.14.213.0+013d129b/MODULE_155a5e57960474557323+2c2d707e/model.neff
ADDED
Binary file (144 kB). View file
|
|
neuronxcc-2.14.213.0+013d129b/MODULE_76901e390efc58ac4dd9+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.213.0+013d129b/MODULE_76901e390efc58ac4dd9+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:acde1e609fafc64814865b8fe9930c942944f7f4ec97345a18e2381754f876b2
|
3 |
+
size 2141727
|
neuronxcc-2.14.213.0+013d129b/MODULE_76901e390efc58ac4dd9+2c2d707e/model.neff
ADDED
Binary file (933 kB). View file
|
|
neuronxcc-2.14.213.0+013d129b/MODULE_dce0056010051b49469f+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.213.0+013d129b/MODULE_dce0056010051b49469f+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:64c24e66e02425f78db74751c80934cac54bb70bd103acb351ff6ef5b10f3648
|
3 |
+
size 45729
|
neuronxcc-2.14.213.0+013d129b/MODULE_dce0056010051b49469f+2c2d707e/model.neff
ADDED
Binary file (462 kB). View file
|
|
neuronxcc-2.14.213.0+013d129b/MODULE_e75ea02f5df3e2da3d47+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.213.0+013d129b/MODULE_e75ea02f5df3e2da3d47+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f1a0d1a9d00ee5f9cee3ac6d5eb29d1171e37f847cc53d235e9180be00aa5cf
|
3 |
+
size 56790
|
neuronxcc-2.14.213.0+013d129b/MODULE_e75ea02f5df3e2da3d47+2c2d707e/model.neff
ADDED
Binary file (144 kB). View file
|
|
neuronxcc-2.14.213.0+013d129b/MODULE_faa46569f7ab44a3175c+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.213.0+013d129b/MODULE_faa46569f7ab44a3175c+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1fb59bd47e3d45277c298cb73390d5684363c184803fa17cdefecfd63a9a23c2
|
3 |
+
size 56790
|
neuronxcc-2.14.213.0+013d129b/MODULE_faa46569f7ab44a3175c+2c2d707e/model.neff
ADDED
Binary file (155 kB). View file
|
|