dacorvo HF Staff commited on
Commit
e7ce9de
·
verified ·
1 Parent(s): 71993be

Synchronizing local compiler cache.

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +10 -0
  2. neuronxcc-2.21.18209.0+043b1bf7/0_REGISTRY/0.3.1.dev7/wav2vec2/hf-internal-testing/tiny-random-Wav2Vec2Model/3fb52d732cf73210c52f.json +113 -0
  3. neuronxcc-2.21.18209.0+043b1bf7/0_REGISTRY/0.4.2.dev0/qwen3/Qwen/Qwen3-Embedding-0.6B/f2e7995fb50bc34695b8.json +87 -0
  4. neuronxcc-2.21.18209.0+043b1bf7/0_REGISTRY/0.4.2.dev0/qwen3/Qwen/Qwen3-Embedding-0.6B/f6847065b14c4394e8d2.json +87 -0
  5. neuronxcc-2.21.18209.0+043b1bf7/MODULE_0586f99d912ae4eebd66+a02c3a36/compile_flags.json +1 -0
  6. neuronxcc-2.21.18209.0+043b1bf7/MODULE_0586f99d912ae4eebd66+a02c3a36/model.done +0 -0
  7. neuronxcc-2.21.18209.0+043b1bf7/MODULE_0586f99d912ae4eebd66+a02c3a36/model.hlo_module.pb +3 -0
  8. neuronxcc-2.21.18209.0+043b1bf7/MODULE_0586f99d912ae4eebd66+a02c3a36/model.neff +3 -0
  9. neuronxcc-2.21.18209.0+043b1bf7/MODULE_0586f99d912ae4eebd66+a02c3a36/wrapped_neff.hlo +3 -0
  10. neuronxcc-2.21.18209.0+043b1bf7/MODULE_0e5b82b136a38372d842+6e4949b4/model.hlo_module.pb +1 -1
  11. neuronxcc-2.21.18209.0+043b1bf7/MODULE_0e5b82b136a38372d842+6e4949b4/model.neff +1 -1
  12. neuronxcc-2.21.18209.0+043b1bf7/MODULE_1023294089137432912+e30acd3a/model.neff +0 -0
  13. neuronxcc-2.21.18209.0+043b1bf7/MODULE_10907752543637211265+e30acd3a/model.neff +0 -0
  14. neuronxcc-2.21.18209.0+043b1bf7/MODULE_10945286243277389437+e30acd3a/model.neff +0 -0
  15. neuronxcc-2.21.18209.0+043b1bf7/MODULE_11400907432531398953+e30acd3a/model.neff +0 -0
  16. neuronxcc-2.21.18209.0+043b1bf7/MODULE_12311847081050718470+e30acd3a/model.neff +0 -0
  17. neuronxcc-2.21.18209.0+043b1bf7/MODULE_12324009378304635855+e30acd3a/model.neff +0 -0
  18. neuronxcc-2.21.18209.0+043b1bf7/MODULE_12509236927544110827+e30acd3a/model.neff +0 -0
  19. neuronxcc-2.21.18209.0+043b1bf7/MODULE_12650363609878702055+e30acd3a/model.neff +0 -0
  20. neuronxcc-2.21.18209.0+043b1bf7/MODULE_12666804432653521811+e30acd3a/model.neff +0 -0
  21. neuronxcc-2.21.18209.0+043b1bf7/MODULE_1277765475941548362+e30acd3a/model.neff +0 -0
  22. neuronxcc-2.21.18209.0+043b1bf7/MODULE_12795949123662846630+e30acd3a/model.neff +0 -0
  23. neuronxcc-2.21.18209.0+043b1bf7/MODULE_13092192882592555392+e30acd3a/model.neff +0 -0
  24. neuronxcc-2.21.18209.0+043b1bf7/MODULE_13129006844218143067+e30acd3a/model.neff +0 -0
  25. neuronxcc-2.21.18209.0+043b1bf7/MODULE_13163168066471565112+e30acd3a/model.neff +0 -0
  26. neuronxcc-2.21.18209.0+043b1bf7/MODULE_13385766575326555678+e30acd3a/model.neff +0 -0
  27. neuronxcc-2.21.18209.0+043b1bf7/MODULE_13521002922414225272+e30acd3a/model.neff +0 -0
  28. neuronxcc-2.21.18209.0+043b1bf7/MODULE_13673338043232097095+e30acd3a/model.neff +0 -0
  29. neuronxcc-2.21.18209.0+043b1bf7/MODULE_14024125047097359821+e30acd3a/model.neff +0 -0
  30. neuronxcc-2.21.18209.0+043b1bf7/MODULE_14271466b8fcc2e97e04+24129607/compile_flags.json +1 -0
  31. neuronxcc-2.21.18209.0+043b1bf7/MODULE_14271466b8fcc2e97e04+24129607/model.done +0 -0
  32. neuronxcc-2.21.18209.0+043b1bf7/MODULE_14271466b8fcc2e97e04+24129607/model.hlo_module.pb +3 -0
  33. neuronxcc-2.21.18209.0+043b1bf7/MODULE_14271466b8fcc2e97e04+24129607/model.neff +3 -0
  34. neuronxcc-2.21.18209.0+043b1bf7/MODULE_14406838977173684020+e30acd3a/model.neff +0 -0
  35. neuronxcc-2.21.18209.0+043b1bf7/MODULE_14488951057292576015+e30acd3a/model.neff +0 -0
  36. neuronxcc-2.21.18209.0+043b1bf7/MODULE_14607415948795306857+e30acd3a/model.neff +0 -0
  37. neuronxcc-2.21.18209.0+043b1bf7/MODULE_15104978417860996248+e30acd3a/model.neff +0 -0
  38. neuronxcc-2.21.18209.0+043b1bf7/MODULE_15195479995167874327+e30acd3a/model.neff +0 -0
  39. neuronxcc-2.21.18209.0+043b1bf7/MODULE_15226158922329678840+e30acd3a/model.neff +0 -0
  40. neuronxcc-2.21.18209.0+043b1bf7/MODULE_15445992300537187360+e30acd3a/model.neff +0 -0
  41. neuronxcc-2.21.18209.0+043b1bf7/MODULE_15549583432468528942+e30acd3a/model.neff +0 -0
  42. neuronxcc-2.21.18209.0+043b1bf7/MODULE_15883166014121986340+e30acd3a/model.neff +0 -0
  43. neuronxcc-2.21.18209.0+043b1bf7/MODULE_15974718484747567133+e30acd3a/model.neff +0 -0
  44. neuronxcc-2.21.18209.0+043b1bf7/MODULE_16063773584643651549+e30acd3a/model.neff +0 -0
  45. neuronxcc-2.21.18209.0+043b1bf7/MODULE_16540141349946602462+e30acd3a/model.neff +0 -0
  46. neuronxcc-2.21.18209.0+043b1bf7/MODULE_1659424179484095552+e30acd3a/model.neff +0 -0
  47. neuronxcc-2.21.18209.0+043b1bf7/MODULE_17037369046574255528+e30acd3a/model.neff +0 -0
  48. neuronxcc-2.21.18209.0+043b1bf7/MODULE_17162153672426857671+e30acd3a/model.neff +0 -0
  49. neuronxcc-2.21.18209.0+043b1bf7/MODULE_17184761711863280677+e30acd3a/model.neff +0 -0
  50. neuronxcc-2.21.18209.0+043b1bf7/MODULE_17685401492131160329+e30acd3a/model.neff +0 -0
.gitattributes CHANGED
@@ -5485,3 +5485,13 @@ neuronxcc-2.21.18209.0+043b1bf7/MODULE_da126386d4d4d4a5bf4f+24129607/model.neff
5485
  neuronxcc-2.21.18209.0+043b1bf7/MODULE_dd4aa1e96fd3b31b162d+24129607/model.neff filter=lfs diff=lfs merge=lfs -text
5486
  neuronxcc-2.21.18209.0+043b1bf7/MODULE_de1482f217f05f48d1dd+fb4cc044/model.neff filter=lfs diff=lfs merge=lfs -text
5487
  neuronxcc-2.21.18209.0+043b1bf7/MODULE_f4bed0e6c1426c4b9bc7+24129607/model.neff filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
5485
  neuronxcc-2.21.18209.0+043b1bf7/MODULE_dd4aa1e96fd3b31b162d+24129607/model.neff filter=lfs diff=lfs merge=lfs -text
5486
  neuronxcc-2.21.18209.0+043b1bf7/MODULE_de1482f217f05f48d1dd+fb4cc044/model.neff filter=lfs diff=lfs merge=lfs -text
5487
  neuronxcc-2.21.18209.0+043b1bf7/MODULE_f4bed0e6c1426c4b9bc7+24129607/model.neff filter=lfs diff=lfs merge=lfs -text
5488
+ neuronxcc-2.21.18209.0+043b1bf7/MODULE_0586f99d912ae4eebd66+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text
5489
+ neuronxcc-2.21.18209.0+043b1bf7/MODULE_0586f99d912ae4eebd66+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
5490
+ neuronxcc-2.21.18209.0+043b1bf7/MODULE_14271466b8fcc2e97e04+24129607/model.neff filter=lfs diff=lfs merge=lfs -text
5491
+ neuronxcc-2.21.18209.0+043b1bf7/MODULE_37a815b3d3073ff820db+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text
5492
+ neuronxcc-2.21.18209.0+043b1bf7/MODULE_37a815b3d3073ff820db+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
5493
+ neuronxcc-2.21.18209.0+043b1bf7/MODULE_3fb52d732cf73210c52f/model.neuron filter=lfs diff=lfs merge=lfs -text
5494
+ neuronxcc-2.21.18209.0+043b1bf7/MODULE_962a482f90524ff403f5+24129607/model.neff filter=lfs diff=lfs merge=lfs -text
5495
+ neuronxcc-2.21.18209.0+043b1bf7/MODULE_accf1fdc5eb1cee6c292+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text
5496
+ neuronxcc-2.21.18209.0+043b1bf7/MODULE_accf1fdc5eb1cee6c292+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
5497
+ neuronxcc-2.21.18209.0+043b1bf7/MODULE_b79a786451ff8fc0676d+24129607/model.neff filter=lfs diff=lfs merge=lfs -text
neuronxcc-2.21.18209.0+043b1bf7/0_REGISTRY/0.3.1.dev7/wav2vec2/hf-internal-testing/tiny-random-Wav2Vec2Model/3fb52d732cf73210c52f.json ADDED
@@ -0,0 +1,113 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_entry_class": "SingleModelCacheEntry",
3
+ "_model_id": "hf-internal-testing/tiny-random-Wav2Vec2Model",
4
+ "_task": "audio-xvector",
5
+ "activation_dropout": 0.1,
6
+ "adapter_attn_dim": null,
7
+ "adapter_kernel_size": 3,
8
+ "adapter_stride": 2,
9
+ "add_adapter": false,
10
+ "apply_spec_augment": true,
11
+ "architectures": [
12
+ "Wav2Vec2Model"
13
+ ],
14
+ "attention_dropout": 0.1,
15
+ "classifier_proj_size": 256,
16
+ "codevector_dim": 256,
17
+ "contrastive_logits_temperature": 0.1,
18
+ "conv_bias": false,
19
+ "conv_dim": [
20
+ 32,
21
+ 32,
22
+ 32
23
+ ],
24
+ "conv_kernel": [
25
+ 8,
26
+ 8,
27
+ 8
28
+ ],
29
+ "conv_stride": [
30
+ 4,
31
+ 4,
32
+ 4
33
+ ],
34
+ "ctc_loss_reduction": "sum",
35
+ "ctc_zero_infinity": false,
36
+ "diversity_loss_weight": 0.1,
37
+ "do_stable_layer_norm": false,
38
+ "feat_extract_activation": "gelu",
39
+ "feat_extract_dropout": 0.0,
40
+ "feat_extract_norm": "group",
41
+ "feat_proj_dropout": 0.0,
42
+ "feat_quantizer_dropout": 0.0,
43
+ "final_dropout": 0.1,
44
+ "hidden_act": "gelu",
45
+ "hidden_dropout": 0.1,
46
+ "hidden_dropout_prob": 0.1,
47
+ "hidden_size": 16,
48
+ "initializer_range": 0.02,
49
+ "intermediate_size": 20,
50
+ "layer_norm_eps": 1e-05,
51
+ "layerdrop": 0.1,
52
+ "mask_feature_length": 10,
53
+ "mask_feature_min_masks": 0,
54
+ "mask_feature_prob": 0.0,
55
+ "mask_time_length": 2,
56
+ "mask_time_min_masks": 2,
57
+ "mask_time_prob": 0.5,
58
+ "model_type": "wav2vec2",
59
+ "neuron": {
60
+ "auto_cast": null,
61
+ "auto_cast_type": null,
62
+ "compiler_type": "neuronx-cc",
63
+ "compiler_version": "2.21.18209.0+043b1bf7",
64
+ "cpu_backend": false,
65
+ "disable_fallback": false,
66
+ "disable_fast_relayout": false,
67
+ "dynamic_batch_size": true,
68
+ "float_dtype": "fp32",
69
+ "inline_weights_to_neff": true,
70
+ "input_names": [
71
+ "input_values"
72
+ ],
73
+ "int_dtype": "int64",
74
+ "model_type": "wav2vec2",
75
+ "optlevel": "2",
76
+ "output_attentions": false,
77
+ "output_hidden_states": false,
78
+ "output_names": [
79
+ "logits",
80
+ "embeddings"
81
+ ],
82
+ "static_audio_sequence_length": 100000,
83
+ "static_batch_size": 1,
84
+ "task": "audio-xvector",
85
+ "tensor_parallel_size": 1
86
+ },
87
+ "num_adapter_layers": 1,
88
+ "num_attention_heads": 2,
89
+ "num_codevector_groups": 2,
90
+ "num_codevectors_per_group": 320,
91
+ "num_conv_pos_embedding_groups": 2,
92
+ "num_conv_pos_embeddings": 16,
93
+ "num_feat_extract_layers": 3,
94
+ "num_hidden_layers": 4,
95
+ "num_negatives": 100,
96
+ "output_hidden_size": 16,
97
+ "proj_codevector_dim": 256,
98
+ "tdnn_dilation": [
99
+ 1,
100
+ 2
101
+ ],
102
+ "tdnn_dim": [
103
+ 32,
104
+ 32
105
+ ],
106
+ "tdnn_kernel": [
107
+ 5,
108
+ 3
109
+ ],
110
+ "use_weighted_layer_sum": false,
111
+ "vocab_size": 32,
112
+ "xvector_output_dim": 32
113
+ }
neuronxcc-2.21.18209.0+043b1bf7/0_REGISTRY/0.4.2.dev0/qwen3/Qwen/Qwen3-Embedding-0.6B/f2e7995fb50bc34695b8.json ADDED
@@ -0,0 +1,87 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_entry_class": "SingleModelCacheEntry",
3
+ "_model_id": "Qwen/Qwen3-Embedding-0.6B",
4
+ "_task": "text-generation",
5
+ "architectures": [
6
+ "Qwen3ForCausalLM"
7
+ ],
8
+ "attention_bias": false,
9
+ "attention_dropout": 0.0,
10
+ "dtype": "bfloat16",
11
+ "head_dim": 128,
12
+ "hidden_act": "silu",
13
+ "hidden_size": 1024,
14
+ "initializer_range": 0.02,
15
+ "intermediate_size": 3072,
16
+ "layer_types": [
17
+ "full_attention",
18
+ "full_attention",
19
+ "full_attention",
20
+ "full_attention",
21
+ "full_attention",
22
+ "full_attention",
23
+ "full_attention",
24
+ "full_attention",
25
+ "full_attention",
26
+ "full_attention",
27
+ "full_attention",
28
+ "full_attention",
29
+ "full_attention",
30
+ "full_attention",
31
+ "full_attention",
32
+ "full_attention",
33
+ "full_attention",
34
+ "full_attention",
35
+ "full_attention",
36
+ "full_attention",
37
+ "full_attention",
38
+ "full_attention",
39
+ "full_attention",
40
+ "full_attention",
41
+ "full_attention",
42
+ "full_attention",
43
+ "full_attention",
44
+ "full_attention"
45
+ ],
46
+ "max_position_embeddings": 32768,
47
+ "max_window_layers": 28,
48
+ "model_type": "qwen3",
49
+ "neuron": {
50
+ "_serialized_key": "NxDNeuronConfig",
51
+ "batch_size": 1,
52
+ "capacity_factor": null,
53
+ "checkpoint_id": "Qwen/Qwen3-Embedding-0.6B",
54
+ "checkpoint_revision": "c54f2e6e80b2d7b7de06f51cec4959f6b3e03418",
55
+ "continuous_batching": false,
56
+ "ep_degree": 1,
57
+ "fused_qkv": true,
58
+ "glu_mlp": true,
59
+ "local_ranks_size": 1,
60
+ "max_batch_size": 1,
61
+ "max_context_length": 1024,
62
+ "max_topk": 256,
63
+ "n_active_tokens": 1024,
64
+ "neuronxcc_version": "2.21.18209.0+043b1bf7",
65
+ "on_device_sampling": false,
66
+ "optimum_neuron_version": "0.4.2.dev0",
67
+ "output_logits": false,
68
+ "pp_degree": 1,
69
+ "sequence_length": 1024,
70
+ "speculation_length": 0,
71
+ "start_rank_id": 0,
72
+ "target": "trn1",
73
+ "torch_dtype": "bfloat16",
74
+ "tp_degree": 1
75
+ },
76
+ "num_attention_heads": 16,
77
+ "num_hidden_layers": 28,
78
+ "num_key_value_heads": 8,
79
+ "rms_norm_eps": 1e-06,
80
+ "rope_scaling": null,
81
+ "rope_theta": 1000000,
82
+ "sliding_window": null,
83
+ "tie_word_embeddings": true,
84
+ "use_cache": true,
85
+ "use_sliding_window": false,
86
+ "vocab_size": 151669
87
+ }
neuronxcc-2.21.18209.0+043b1bf7/0_REGISTRY/0.4.2.dev0/qwen3/Qwen/Qwen3-Embedding-0.6B/f6847065b14c4394e8d2.json ADDED
@@ -0,0 +1,87 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_entry_class": "SingleModelCacheEntry",
3
+ "_model_id": "Qwen/Qwen3-Embedding-0.6B",
4
+ "_task": "text-generation",
5
+ "architectures": [
6
+ "Qwen3ForCausalLM"
7
+ ],
8
+ "attention_bias": false,
9
+ "attention_dropout": 0.0,
10
+ "dtype": "bfloat16",
11
+ "head_dim": 128,
12
+ "hidden_act": "silu",
13
+ "hidden_size": 1024,
14
+ "initializer_range": 0.02,
15
+ "intermediate_size": 3072,
16
+ "layer_types": [
17
+ "full_attention",
18
+ "full_attention",
19
+ "full_attention",
20
+ "full_attention",
21
+ "full_attention",
22
+ "full_attention",
23
+ "full_attention",
24
+ "full_attention",
25
+ "full_attention",
26
+ "full_attention",
27
+ "full_attention",
28
+ "full_attention",
29
+ "full_attention",
30
+ "full_attention",
31
+ "full_attention",
32
+ "full_attention",
33
+ "full_attention",
34
+ "full_attention",
35
+ "full_attention",
36
+ "full_attention",
37
+ "full_attention",
38
+ "full_attention",
39
+ "full_attention",
40
+ "full_attention",
41
+ "full_attention",
42
+ "full_attention",
43
+ "full_attention",
44
+ "full_attention"
45
+ ],
46
+ "max_position_embeddings": 32768,
47
+ "max_window_layers": 28,
48
+ "model_type": "qwen3",
49
+ "neuron": {
50
+ "_serialized_key": "NxDNeuronConfig",
51
+ "batch_size": 1,
52
+ "capacity_factor": null,
53
+ "checkpoint_id": "Qwen/Qwen3-Embedding-0.6B",
54
+ "checkpoint_revision": "c54f2e6e80b2d7b7de06f51cec4959f6b3e03418",
55
+ "continuous_batching": false,
56
+ "ep_degree": 1,
57
+ "fused_qkv": true,
58
+ "glu_mlp": true,
59
+ "local_ranks_size": 24,
60
+ "max_batch_size": 1,
61
+ "max_context_length": 1024,
62
+ "max_topk": 256,
63
+ "n_active_tokens": 1024,
64
+ "neuronxcc_version": "2.21.18209.0+043b1bf7",
65
+ "on_device_sampling": true,
66
+ "optimum_neuron_version": "0.4.2.dev0",
67
+ "output_logits": false,
68
+ "pp_degree": 1,
69
+ "sequence_length": 1024,
70
+ "speculation_length": 0,
71
+ "start_rank_id": 0,
72
+ "target": "trn1",
73
+ "torch_dtype": "bfloat16",
74
+ "tp_degree": 24
75
+ },
76
+ "num_attention_heads": 16,
77
+ "num_hidden_layers": 28,
78
+ "num_key_value_heads": 8,
79
+ "rms_norm_eps": 1e-06,
80
+ "rope_scaling": null,
81
+ "rope_theta": 1000000,
82
+ "sliding_window": null,
83
+ "tie_word_embeddings": true,
84
+ "use_cache": true,
85
+ "use_sliding_window": false,
86
+ "vocab_size": 151669
87
+ }
neuronxcc-2.21.18209.0+043b1bf7/MODULE_0586f99d912ae4eebd66+a02c3a36/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"]
neuronxcc-2.21.18209.0+043b1bf7/MODULE_0586f99d912ae4eebd66+a02c3a36/model.done ADDED
File without changes
neuronxcc-2.21.18209.0+043b1bf7/MODULE_0586f99d912ae4eebd66+a02c3a36/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a6ce6eb6a6e9092fb242da88b081169884a4e9ffb86c8f61e48dde2a9df68e9
3
+ size 658089
neuronxcc-2.21.18209.0+043b1bf7/MODULE_0586f99d912ae4eebd66+a02c3a36/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c4b22075302d3aff9fbc0ac3d3830740c1622603352852610cba25e704ec601b
3
+ size 717824
neuronxcc-2.21.18209.0+043b1bf7/MODULE_0586f99d912ae4eebd66+a02c3a36/wrapped_neff.hlo ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79fd08910a986ab1b585a9f2e6fbe14c19a3321014652f25f8dd1d1274ebf7ee
3
+ size 853136
neuronxcc-2.21.18209.0+043b1bf7/MODULE_0e5b82b136a38372d842+6e4949b4/model.hlo_module.pb CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ceb0a23b716925f843a16e15f9f0385f067950c8f9f55cd7b3db583ba03b1a7e
3
  size 84807
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e836c6bbdddd0f87e50203756e12757180235ce3d83d59d598f073d7c76e335b
3
  size 84807
neuronxcc-2.21.18209.0+043b1bf7/MODULE_0e5b82b136a38372d842+6e4949b4/model.neff CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0f26bc2e40e6e21bffa40348dd28785a0c5ba6ae26126553c85435559849af5d
3
  size 646144
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1fb27b3c750546f4a06036bc56bdc41a2a97288350a5a0427e04855594a6cb1
3
  size 646144
neuronxcc-2.21.18209.0+043b1bf7/MODULE_1023294089137432912+e30acd3a/model.neff CHANGED
Binary files a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_1023294089137432912+e30acd3a/model.neff and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_1023294089137432912+e30acd3a/model.neff differ
 
neuronxcc-2.21.18209.0+043b1bf7/MODULE_10907752543637211265+e30acd3a/model.neff CHANGED
Binary files a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_10907752543637211265+e30acd3a/model.neff and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_10907752543637211265+e30acd3a/model.neff differ
 
neuronxcc-2.21.18209.0+043b1bf7/MODULE_10945286243277389437+e30acd3a/model.neff CHANGED
Binary files a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_10945286243277389437+e30acd3a/model.neff and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_10945286243277389437+e30acd3a/model.neff differ
 
neuronxcc-2.21.18209.0+043b1bf7/MODULE_11400907432531398953+e30acd3a/model.neff CHANGED
Binary files a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_11400907432531398953+e30acd3a/model.neff and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_11400907432531398953+e30acd3a/model.neff differ
 
neuronxcc-2.21.18209.0+043b1bf7/MODULE_12311847081050718470+e30acd3a/model.neff CHANGED
Binary files a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_12311847081050718470+e30acd3a/model.neff and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_12311847081050718470+e30acd3a/model.neff differ
 
neuronxcc-2.21.18209.0+043b1bf7/MODULE_12324009378304635855+e30acd3a/model.neff CHANGED
Binary files a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_12324009378304635855+e30acd3a/model.neff and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_12324009378304635855+e30acd3a/model.neff differ
 
neuronxcc-2.21.18209.0+043b1bf7/MODULE_12509236927544110827+e30acd3a/model.neff CHANGED
Binary files a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_12509236927544110827+e30acd3a/model.neff and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_12509236927544110827+e30acd3a/model.neff differ
 
neuronxcc-2.21.18209.0+043b1bf7/MODULE_12650363609878702055+e30acd3a/model.neff CHANGED
Binary files a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_12650363609878702055+e30acd3a/model.neff and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_12650363609878702055+e30acd3a/model.neff differ
 
neuronxcc-2.21.18209.0+043b1bf7/MODULE_12666804432653521811+e30acd3a/model.neff CHANGED
Binary files a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_12666804432653521811+e30acd3a/model.neff and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_12666804432653521811+e30acd3a/model.neff differ
 
neuronxcc-2.21.18209.0+043b1bf7/MODULE_1277765475941548362+e30acd3a/model.neff CHANGED
Binary files a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_1277765475941548362+e30acd3a/model.neff and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_1277765475941548362+e30acd3a/model.neff differ
 
neuronxcc-2.21.18209.0+043b1bf7/MODULE_12795949123662846630+e30acd3a/model.neff CHANGED
Binary files a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_12795949123662846630+e30acd3a/model.neff and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_12795949123662846630+e30acd3a/model.neff differ
 
neuronxcc-2.21.18209.0+043b1bf7/MODULE_13092192882592555392+e30acd3a/model.neff CHANGED
Binary files a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_13092192882592555392+e30acd3a/model.neff and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_13092192882592555392+e30acd3a/model.neff differ
 
neuronxcc-2.21.18209.0+043b1bf7/MODULE_13129006844218143067+e30acd3a/model.neff CHANGED
Binary files a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_13129006844218143067+e30acd3a/model.neff and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_13129006844218143067+e30acd3a/model.neff differ
 
neuronxcc-2.21.18209.0+043b1bf7/MODULE_13163168066471565112+e30acd3a/model.neff CHANGED
Binary files a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_13163168066471565112+e30acd3a/model.neff and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_13163168066471565112+e30acd3a/model.neff differ
 
neuronxcc-2.21.18209.0+043b1bf7/MODULE_13385766575326555678+e30acd3a/model.neff CHANGED
Binary files a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_13385766575326555678+e30acd3a/model.neff and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_13385766575326555678+e30acd3a/model.neff differ
 
neuronxcc-2.21.18209.0+043b1bf7/MODULE_13521002922414225272+e30acd3a/model.neff CHANGED
Binary files a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_13521002922414225272+e30acd3a/model.neff and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_13521002922414225272+e30acd3a/model.neff differ
 
neuronxcc-2.21.18209.0+043b1bf7/MODULE_13673338043232097095+e30acd3a/model.neff CHANGED
Binary files a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_13673338043232097095+e30acd3a/model.neff and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_13673338043232097095+e30acd3a/model.neff differ
 
neuronxcc-2.21.18209.0+043b1bf7/MODULE_14024125047097359821+e30acd3a/model.neff CHANGED
Binary files a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_14024125047097359821+e30acd3a/model.neff and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_14024125047097359821+e30acd3a/model.neff differ
 
neuronxcc-2.21.18209.0+043b1bf7/MODULE_14271466b8fcc2e97e04+24129607/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"]
neuronxcc-2.21.18209.0+043b1bf7/MODULE_14271466b8fcc2e97e04+24129607/model.done ADDED
File without changes
neuronxcc-2.21.18209.0+043b1bf7/MODULE_14271466b8fcc2e97e04+24129607/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3468b6e74d336f18fe28b6fe457a52cef249b9630225261813c967bf71d19e44
3
+ size 586051
neuronxcc-2.21.18209.0+043b1bf7/MODULE_14271466b8fcc2e97e04+24129607/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b54408c237472906fdcf6d1aa87649570b887f3690627b94b699d9fc666dea5b
3
+ size 7097344
neuronxcc-2.21.18209.0+043b1bf7/MODULE_14406838977173684020+e30acd3a/model.neff CHANGED
Binary files a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_14406838977173684020+e30acd3a/model.neff and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_14406838977173684020+e30acd3a/model.neff differ
 
neuronxcc-2.21.18209.0+043b1bf7/MODULE_14488951057292576015+e30acd3a/model.neff CHANGED
Binary files a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_14488951057292576015+e30acd3a/model.neff and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_14488951057292576015+e30acd3a/model.neff differ
 
neuronxcc-2.21.18209.0+043b1bf7/MODULE_14607415948795306857+e30acd3a/model.neff CHANGED
Binary files a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_14607415948795306857+e30acd3a/model.neff and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_14607415948795306857+e30acd3a/model.neff differ
 
neuronxcc-2.21.18209.0+043b1bf7/MODULE_15104978417860996248+e30acd3a/model.neff CHANGED
Binary files a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15104978417860996248+e30acd3a/model.neff and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15104978417860996248+e30acd3a/model.neff differ
 
neuronxcc-2.21.18209.0+043b1bf7/MODULE_15195479995167874327+e30acd3a/model.neff CHANGED
Binary files a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15195479995167874327+e30acd3a/model.neff and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15195479995167874327+e30acd3a/model.neff differ
 
neuronxcc-2.21.18209.0+043b1bf7/MODULE_15226158922329678840+e30acd3a/model.neff CHANGED
Binary files a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15226158922329678840+e30acd3a/model.neff and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15226158922329678840+e30acd3a/model.neff differ
 
neuronxcc-2.21.18209.0+043b1bf7/MODULE_15445992300537187360+e30acd3a/model.neff CHANGED
Binary files a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15445992300537187360+e30acd3a/model.neff and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15445992300537187360+e30acd3a/model.neff differ
 
neuronxcc-2.21.18209.0+043b1bf7/MODULE_15549583432468528942+e30acd3a/model.neff CHANGED
Binary files a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15549583432468528942+e30acd3a/model.neff and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15549583432468528942+e30acd3a/model.neff differ
 
neuronxcc-2.21.18209.0+043b1bf7/MODULE_15883166014121986340+e30acd3a/model.neff CHANGED
Binary files a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15883166014121986340+e30acd3a/model.neff and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15883166014121986340+e30acd3a/model.neff differ
 
neuronxcc-2.21.18209.0+043b1bf7/MODULE_15974718484747567133+e30acd3a/model.neff CHANGED
Binary files a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15974718484747567133+e30acd3a/model.neff and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15974718484747567133+e30acd3a/model.neff differ
 
neuronxcc-2.21.18209.0+043b1bf7/MODULE_16063773584643651549+e30acd3a/model.neff CHANGED
Binary files a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_16063773584643651549+e30acd3a/model.neff and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_16063773584643651549+e30acd3a/model.neff differ
 
neuronxcc-2.21.18209.0+043b1bf7/MODULE_16540141349946602462+e30acd3a/model.neff CHANGED
Binary files a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_16540141349946602462+e30acd3a/model.neff and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_16540141349946602462+e30acd3a/model.neff differ
 
neuronxcc-2.21.18209.0+043b1bf7/MODULE_1659424179484095552+e30acd3a/model.neff CHANGED
Binary files a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_1659424179484095552+e30acd3a/model.neff and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_1659424179484095552+e30acd3a/model.neff differ
 
neuronxcc-2.21.18209.0+043b1bf7/MODULE_17037369046574255528+e30acd3a/model.neff CHANGED
Binary files a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_17037369046574255528+e30acd3a/model.neff and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_17037369046574255528+e30acd3a/model.neff differ
 
neuronxcc-2.21.18209.0+043b1bf7/MODULE_17162153672426857671+e30acd3a/model.neff CHANGED
Binary files a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_17162153672426857671+e30acd3a/model.neff and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_17162153672426857671+e30acd3a/model.neff differ
 
neuronxcc-2.21.18209.0+043b1bf7/MODULE_17184761711863280677+e30acd3a/model.neff CHANGED
Binary files a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_17184761711863280677+e30acd3a/model.neff and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_17184761711863280677+e30acd3a/model.neff differ
 
neuronxcc-2.21.18209.0+043b1bf7/MODULE_17685401492131160329+e30acd3a/model.neff CHANGED
Binary files a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_17685401492131160329+e30acd3a/model.neff and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_17685401492131160329+e30acd3a/model.neff differ