Synchronizing local compiler cache.
Browse files- .gitattributes +2 -0
- neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/qwen2/deepseek-ai/DeepSeek-R1-Distill-Qwen-32B/f42fa051a05e2d257ef4.json +1 -0
- neuronxcc-2.16.372.0+4a9b2326/MODULE_39cb90b37ee6fff24f5d+613edded/compile_flags.json +1 -0
- neuronxcc-2.16.372.0+4a9b2326/MODULE_39cb90b37ee6fff24f5d+613edded/model.done +0 -0
- neuronxcc-2.16.372.0+4a9b2326/MODULE_39cb90b37ee6fff24f5d+613edded/model.hlo_module.pb +3 -0
- neuronxcc-2.16.372.0+4a9b2326/MODULE_39cb90b37ee6fff24f5d+613edded/model.neff +3 -0
- neuronxcc-2.16.372.0+4a9b2326/MODULE_45dec79bcb55d7eacd60+613edded/compile_flags.json +1 -0
- neuronxcc-2.16.372.0+4a9b2326/MODULE_45dec79bcb55d7eacd60+613edded/model.done +0 -0
- neuronxcc-2.16.372.0+4a9b2326/MODULE_45dec79bcb55d7eacd60+613edded/model.hlo_module.pb +3 -0
- neuronxcc-2.16.372.0+4a9b2326/MODULE_45dec79bcb55d7eacd60+613edded/model.neff +3 -0
.gitattributes
CHANGED
@@ -7230,3 +7230,5 @@ neuronxcc-2.16.372.0+4a9b2326/MODULE_54ad43f123eecd242b32/vae_decoder/model.neur
|
|
7230 |
neuronxcc-2.16.372.0+4a9b2326/MODULE_54ad43f123eecd242b32/vae_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
7231 |
neuronxcc-2.16.372.0+4a9b2326/MODULE_5d5e4206a466b7852561+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
|
7232 |
neuronxcc-2.16.372.0+4a9b2326/MODULE_b5092ae1e071cef3fe8a+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
7230 |
neuronxcc-2.16.372.0+4a9b2326/MODULE_54ad43f123eecd242b32/vae_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
7231 |
neuronxcc-2.16.372.0+4a9b2326/MODULE_5d5e4206a466b7852561+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
|
7232 |
neuronxcc-2.16.372.0+4a9b2326/MODULE_b5092ae1e071cef3fe8a+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
|
7233 |
+
neuronxcc-2.16.372.0+4a9b2326/MODULE_39cb90b37ee6fff24f5d+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
|
7234 |
+
neuronxcc-2.16.372.0+4a9b2326/MODULE_45dec79bcb55d7eacd60+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
|
neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/qwen2/deepseek-ai/DeepSeek-R1-Distill-Qwen-32B/f42fa051a05e2d257ef4.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["Qwen2ForCausalLM"], "attention_dropout": 0.0, "bos_token_id": 151643, "eos_token_id": 151643, "hidden_act": "silu", "hidden_size": 5120, "initializer_range": 0.02, "intermediate_size": 27648, "max_position_embeddings": 131072, "max_window_layers": 64, "model_type": "qwen2", "neuron": {"auto_cast_type": "bf16", "batch_size": 1, "checkpoint_id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", "checkpoint_revision": "3865e12a1eb7cbd641ab3f9dfc28c588c6b0c1e9", "compiler_type": "neuronx-cc", "compiler_version": "2.16.372.0+4a9b2326", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 40, "num_hidden_layers": 64, "num_key_value_heads": 8, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 1000000.0, "sliding_window": null, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "use_sliding_window": false, "vocab_size": 152064}
|
neuronxcc-2.16.372.0+4a9b2326/MODULE_39cb90b37ee6fff24f5d+613edded/compile_flags.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"]
|
neuronxcc-2.16.372.0+4a9b2326/MODULE_39cb90b37ee6fff24f5d+613edded/model.done
ADDED
File without changes
|
neuronxcc-2.16.372.0+4a9b2326/MODULE_39cb90b37ee6fff24f5d+613edded/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bdb9df77a1a3625ab36b1710ccfe5f59ecaef443165e3c6f4438e4568782c0e6
|
3 |
+
size 884860
|
neuronxcc-2.16.372.0+4a9b2326/MODULE_39cb90b37ee6fff24f5d+613edded/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4dbf18709e10e2b41a1be5b73528a365fbdd2d53689bff7dcbe7fc9bf68d087d
|
3 |
+
size 3267584
|
neuronxcc-2.16.372.0+4a9b2326/MODULE_45dec79bcb55d7eacd60+613edded/compile_flags.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"]
|
neuronxcc-2.16.372.0+4a9b2326/MODULE_45dec79bcb55d7eacd60+613edded/model.done
ADDED
File without changes
|
neuronxcc-2.16.372.0+4a9b2326/MODULE_45dec79bcb55d7eacd60+613edded/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:845fffaec7806ef3a10402cd19203688a9cf944647b5ea1e4f66a733354cc120
|
3 |
+
size 749196
|
neuronxcc-2.16.372.0+4a9b2326/MODULE_45dec79bcb55d7eacd60+613edded/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:387a80bb98ff9b7af4f8bd7e5daeb9e28115d94ffd995ee740b35b557862a165
|
3 |
+
size 8930304
|