dacorvo HF Staff committed on
Commit
6681409
·
verified ·
1 Parent(s): 69f658e

Synchronizing local compiler cache.

Browse files
neuronxcc-2.15.143.0+e39249ad/0_REGISTRY/0.0.28.dev2/inference/llama/deepseek-ai/DeepSeek-R1-Distill-Llama-8B/a7613f1e0925b7136874.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 128000, "eos_token_id": 128001, "head_dim": 128, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 14336, "max_position_embeddings": 131072, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "bf16", "batch_size": 4, "checkpoint_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-8B", "checkpoint_revision": "ebf7e8d03db3d86a442d22d30d499abb7ec27bea", "compiler_type": "neuronx-cc", "compiler_version": "2.15.143.0+e39249ad", "num_cores": 2, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 8, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": {"factor": 8.0, "high_freq_factor": 4.0, "low_freq_factor": 1.0, "original_max_position_embeddings": 8192, "rope_type": "llama3"}, "rope_theta": 500000.0, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 128256}
neuronxcc-2.15.143.0+e39249ad/MODULE_a89ef5a5abc47372ac48+39f12043/model.neff CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:27277d70287878c1ae246cf16744aa8701ecacedf928e2a5047a09425ae457c9
3
  size 6022144
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45061067d2cd47f49237cd76fd3dbbdb369f5e5353755c16a9c651a36184bdc4
3
  size 6022144
neuronxcc-2.15.143.0+e39249ad/MODULE_d0c1049c1f409a3c8074+39f12043/model.neff CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:35496ffcddef3c3a83d63963ed5db8a535a2ae3c85083ff0054dc0c1334b4d5d
3
  size 6063104
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64090d625b4441fdf3a02da937a9208ca54660b37120f3b0dff4b2391aec645a
3
  size 6063104
neuronxcc-2.15.143.0+e39249ad/MODULE_fac5455884c9dfdee723+39f12043/model.neff CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cef183fb7618558c0a74d7d11be16eb629e931fe2565fa319226a5f875c3cdaf
3
  size 10456064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1782316803bef695366ddf853aef687dff787e9f7d3efb68e30b5d7dcc6b843
3
  size 10456064