optimum-internal-testing-user commited on
Commit
41a6466
·
verified ·
1 Parent(s): 51aeb0a

Synchronizing local compiler cache.

Browse files
neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/llama/llamafactory/tiny-random-Llama-3/5d5179e2ac0b724548b0.json ADDED
@@ -0,0 +1,63 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_entry_class": "SingleModelCacheEntry",
3
+ "_model_id": "llamafactory/tiny-random-Llama-3",
4
+ "_task": "text-generation",
5
+ "architectures": [
6
+ "LlamaForCausalLM"
7
+ ],
8
+ "attention_bias": false,
9
+ "attention_dropout": 0.0,
10
+ "dtype": "float16",
11
+ "head_dim": 4,
12
+ "hidden_act": "silu",
13
+ "hidden_size": 16,
14
+ "initializer_range": 0.02,
15
+ "intermediate_size": 64,
16
+ "max_position_embeddings": 131072,
17
+ "mlp_bias": false,
18
+ "model_type": "llama",
19
+ "neuron": {
20
+ "_serialized_key": "NxDNeuronConfig",
21
+ "batch_size": 1,
22
+ "capacity_factor": null,
23
+ "checkpoint_id": "llamafactory/tiny-random-Llama-3",
24
+ "checkpoint_revision": "bf2a2e3bf199ad2ee96f02a3c00246c608db22a8",
25
+ "continuous_batching": false,
26
+ "ep_degree": 1,
27
+ "fused_qkv": true,
28
+ "glu_mlp": true,
29
+ "local_ranks_size": 2,
30
+ "max_batch_size": 1,
31
+ "max_context_length": 1024,
32
+ "max_topk": 256,
33
+ "n_active_tokens": 1024,
34
+ "neuronxcc_version": "2.21.33363.0+82129205",
35
+ "on_device_sampling": true,
36
+ "optimum_neuron_version": "0.4.6.dev3",
37
+ "output_logits": false,
38
+ "pp_degree": 1,
39
+ "prefill_chunk_size": 0,
40
+ "sequence_length": 1024,
41
+ "speculation_length": 0,
42
+ "start_rank_id": 0,
43
+ "target": "trn1",
44
+ "torch_dtype": "float16",
45
+ "tp_degree": 2
46
+ },
47
+ "num_attention_heads": 4,
48
+ "num_hidden_layers": 2,
49
+ "num_key_value_heads": 4,
50
+ "pretraining_tp": 1,
51
+ "rms_norm_eps": 1e-05,
52
+ "rope_scaling": {
53
+ "factor": 8.0,
54
+ "high_freq_factor": 4.0,
55
+ "low_freq_factor": 1.0,
56
+ "original_max_position_embeddings": 8192,
57
+ "rope_type": "llama3"
58
+ },
59
+ "rope_theta": 500000.0,
60
+ "tie_word_embeddings": false,
61
+ "use_cache": true,
62
+ "vocab_size": 128256
63
+ }
neuronxcc-2.21.33363.0+82129205/MODULE_71833bfb10ff3967bd3d+6170d8e1/model.hlo_module.pb CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:37173b87f2098da51055199893cf6d6b5bc3702f5fca629ddb79f66ed168542f
3
  size 1207180
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:631e2888f6ee71acf1c9eb784246d591937aa8de79993a6850177196c2bc8fa2
3
  size 1207180
neuronxcc-2.21.33363.0+82129205/MODULE_71833bfb10ff3967bd3d+6170d8e1/model.neff CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f8a417d4b56c38409fb6a94321596dbdec1fbdfd15f15a1ad70defd0cd2990d2
3
  size 58307584
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec3da1c0626101d789222ba962ee1f2b30e606a10b59ead008350d5bc0a19e62
3
  size 58307584
neuronxcc-2.21.33363.0+82129205/MODULE_c68ed9d0d3211fb37165+24129607/model.hlo_module.pb CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:990cedcdabb6c3f81555756a62bf720aa67bcf902b798c5bc0ecb2cb1ec99630
3
  size 839610
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:503f2ba00e01ec69dbbab68e814ed2bb73f646b48b6892b515292a585e9dfe2d
3
  size 839610
neuronxcc-2.21.33363.0+82129205/MODULE_c68ed9d0d3211fb37165+24129607/model.neff CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:92c65c63a8e9840b2f33dd94af5dfbcb5f2ab85c916c9e4a9d187aee75c218b2
3
  size 12626944
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac9d8573bdda4cd25a8b90976246d32cdd841ea5e0890eb3aa6f7ee6a972eb94
3
  size 12626944
neuronxcc-2.21.33363.0+82129205/MODULE_d50f09930f3886ac4b66+a02c3a36/model.hlo_module.pb CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:179bdac81143630f9d441635b2b26fa7932ed558003eca339746b0003a725b51
3
  size 904767
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df3122b05453bf9f572786aa49b7e5df0168024a8f52330ce2671cc7e157cd81
3
  size 904767
neuronxcc-2.21.33363.0+82129205/MODULE_d50f09930f3886ac4b66+a02c3a36/model.neff CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5e6900510a254b86a4ffcfcd78e3945ce983f70412294bfc4d1601bb1c498a31
3
  size 5827584
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6283f00665e3747e029a916a314a7185c78798b530296350881c6422ec1cad72
3
  size 5827584
neuronxcc-2.21.33363.0+82129205/MODULE_d50f09930f3886ac4b66+a02c3a36/wrapped_neff.hlo CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:78bd99eed94739629493c0119fe7539423a10b254fdc448290f2a690371625a0
3
  size 5994108
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f36761cca5a82603e8d8cb052c52a7b98c82217d90b6c06f094e68d980b82636
3
  size 5994108