Jingya HF Staff committed on
Commit
335766f
·
1 Parent(s): 4baaf20
.gitattributes CHANGED
@@ -32,3 +32,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
32
  *.zip filter=lfs diff=lfs merge=lfs -text
33
  *.zst filter=lfs diff=lfs merge=lfs -text
34
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
32
  *.zip filter=lfs diff=lfs merge=lfs -text
33
  *.zst filter=lfs diff=lfs merge=lfs -text
34
  *tfevents* filter=lfs diff=lfs merge=lfs -text
35
+ model.neuron filter=lfs diff=lfs merge=lfs -text
all_metrics.csv ADDED
@@ -0,0 +1,102 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ timestamp,run_id,name,subgraph,scope,sub_scope,value,unit,
2
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,CanonicalizeIR,0.017186403274536133,Seconds
3
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,ExpandBatchNorm,0.01916646957397461,Seconds
4
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,ResolveComplicatePredicates,0.014917135238647461,Seconds
5
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,AffinePredicateResolution,0.016184329986572266,Seconds
6
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,EliminateDivs,0.01639723777770996,Seconds
7
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,TensorOpFusion,0.01917290687561035,Seconds
8
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,TensorOpTransform,0.07087397575378418,Seconds
9
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,LowerTensorOp,0.022517681121826172,Seconds
10
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,MemcpyElimination,1.7591924667358398,Seconds
11
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,DeadStoreElimination,1.3543994426727295,Seconds
12
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,SimplifySlice,0.004833698272705078,Seconds
13
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,PadElimination,0.0003750324249267578,Seconds
14
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,LoopFusion,0.6292195320129395,Seconds
15
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,ValueNumbering,0.05216097831726074,Seconds
16
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,TCTransform,0.03180551528930664,Seconds
17
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,CommuteConcat,0.017305850982666016,Seconds
18
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,RecognizeOpIdiom,0.02877211570739746,Seconds
19
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,MaskPropagation,0.02014327049255371,Seconds
20
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,Recompute,0.0010938644409179688,Seconds
21
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,DoNothing,9.202957153320312e-05,Seconds
22
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,MutateDataType,0.0039331912994384766,Seconds
23
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,AutoCastTCInputs,0.007624387741088867,Seconds
24
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,GenericAccessSimplifier,0.023320674896240234,Seconds
25
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,Simplifier,0.8014688491821289,Seconds
26
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,Delinearization,0.06728005409240723,Seconds
27
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,DelinearIndices,0.02657461166381836,Seconds
28
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,DeadCodeElimination,0.011566877365112305,Seconds
29
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,LegalizeCCOpLayout,0.005419015884399414,Seconds
30
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,InferIntrinsicOnCC,0.09969019889831543,Seconds
31
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,ResolveAccessConflict,0.05235028266906738,Seconds
32
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,LocalLayoutOpt,0.04341483116149902,Seconds
33
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,GlobalLayoutOpt,0.7055702209472656,Seconds
34
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,CanonicalizeDAG,0.013588666915893555,Seconds
35
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,FlattenAxesForTiling,0.014940977096557617,Seconds
36
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,SundaSizeTiling,0.9656670093536377,Seconds
37
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,InferTongaTensor,0.34017038345336914,Seconds
38
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,RewriteReplicationMatmul,0.013017892837524414,Seconds
39
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,DataLocalityOpt,2.8061411380767822,Seconds
40
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,TilingProfiler,0.016730785369873047,Seconds
41
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,LegalizeSundaMacro,0.04242563247680664,Seconds
42
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,PerfectLoopNest,0.02962350845336914,Seconds
43
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,RewriteWeights,1.0260913372039795,Seconds
44
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,ReshapeWeights,0.008316755294799805,Seconds
45
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,FlattenMacroLoop,0.1311652660369873,Seconds
46
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,SimplifyPredicates,0.4593665599822998,Seconds
47
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,InferInitValue,1.6139848232269287,Seconds
48
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,TongaSimplifier,0.14111781120300293,Seconds
49
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,SimplifyTensor,0.06602692604064941,Seconds
50
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,LICM,0.19344878196716309,Seconds
51
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,SundaISel,0.381380558013916,Seconds
52
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,TongaLoopFusion,0.20348381996154785,Seconds
53
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,FactorizeBlkDims,0.14890217781066895,Seconds
54
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,TongaValueNumbering,0.04577326774597168,Seconds
55
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,TongaInstComb,0.6017858982086182,Seconds
56
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,VectorizeMatMult,0.004251718521118164,Seconds
57
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,VectorizeDMA,0.03434181213378906,Seconds
58
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,LegalizePartitionReduce,0.007041454315185547,Seconds
59
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,PartialLoopFusion,0.22039031982421875,Seconds
60
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,LowerTranspose,0.07951807975769043,Seconds
61
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,LateTongaInstComb,0.39994359016418457,Seconds
62
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,LowerTongaBatchId,0.003979682922363281,Seconds
63
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,SplitAccGrp,0.007310152053833008,Seconds
64
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,SpillPSum,0.14673376083374023,Seconds
65
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,TongaLICM,0.0832223892211914,Seconds
66
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,InferPSumTensor,0.12006378173828125,Seconds
67
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,WeightCoalescing,0.030175209045410156,Seconds
68
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,LowerIntrinsics,0.007158994674682617,Seconds
69
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,LegalizeSundaAccess,0.04524707794189453,Seconds
70
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,TongaAffineLoopXform,0.021468400955200195,Seconds
71
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,VectorizeAllReduce,0.006783723831176758,Seconds
72
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,RelaxPredicates,0.013041973114013672,Seconds
73
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,TensorInitialization,0.006761789321899414,Seconds
74
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,TongaSimplifyPredicates,0.022147417068481445,Seconds
75
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,ExpandISAMacro,0.08670711517333984,Seconds
76
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,LegalizeType,0.0201413631439209,Seconds
77
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,SimplifyTongaTensor,0.026923418045043945,Seconds
78
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,DMALocalityOpt,0.005611896514892578,Seconds
79
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,DataStreaming,0.020259380340576172,Seconds
80
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,PSUMModuloAlloc,0.626401424407959,Seconds
81
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,LegalizeStreamShuffle,0.009877920150756836,Seconds
82
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,CoalesceCCOp,0.009194374084472656,Seconds
83
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,SimpleAllReduceTiling,0.008142232894897461,Seconds
84
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,StaticProfiler,0.032608985900878906,Seconds
85
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,SplitAPUnionSets,0.12148618698120117,Seconds
86
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,SundaLowerGenericAccess,0.008048057556152344,Seconds
87
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,DumpGraphAndMetadata,0.023069143295288086,Seconds
88
+ ,bert-base-NER-neuronx,CompilationTime,sg0000,Tensorizer,BirCodeGenLoop,0.2962992191314697,Seconds
89
+ ,bert-base-NER-neuronx,CompilationTime,root,Tensorizer,All,19.601213693618774,Seconds
90
+ ,bert-base-NER-neuronx,TPBCount,None,KELP,None,1,Count
91
+ ,bert-base-NER-neuronx,CompilationTime,root,Frontend,0,20.514663457870483,Seconds
92
+ ,bert-base-NER-neuronx,CompilationTime,all,Frontend,0,20.519617319107056,Seconds
93
+ ,bert-base-NER-neuronx,CompilationTime,sg00,HHChecker,0,6.9141387939453125e-06,Seconds
94
+ ,bert-base-NER-neuronx,CompilationTime,all,HHChecker,0,0.004280805587768555,Seconds
95
+ ,bert-base-NER-neuronx,CompilationTime,sg00,WalrusDriver,0,1.3388400077819824,Seconds
96
+ ,bert-base-NER-neuronx,CompilationTime,all,WalrusDriver,0,1.3458526134490967,Seconds
97
+ ,bert-base-NER-neuronx,EstimatedLowerBoundLatency,None,KELP,None,0,Milliseconds
98
+ ,bert-base-NER-neuronx,EstimatedUpperBoundThroughput,None,KELP,None,0,Count/Second
99
+ ,bert-base-NER-neuronx,InferentiaDRAMUsage,None,KELP,None,0,Bytes
100
+ ,bert-base-NER-neuronx,CompilationTime,all,Kelper,0,4.668492078781128,Seconds
101
+ ,bert-base-NER-neuronx,CompilationTime,root,Pipeline,0,26.555312633514404,Seconds
102
+ ,bert-base-NER-neuronx,CompilationTime,all,production_total,None,26.53824281692505,Seconds
config.json ADDED
@@ -0,0 +1,62 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "dslim/bert-base-NER",
3
+ "_num_labels": 9,
4
+ "architectures": [
5
+ "BertForTokenClassification"
6
+ ],
7
+ "attention_probs_dropout_prob": 0.1,
8
+ "auto_cast": null,
9
+ "auto_cast_type": null,
10
+ "classifier_dropout": null,
11
+ "dynamic_batch_size": true,
12
+ "hidden_act": "gelu",
13
+ "hidden_dropout_prob": 0.1,
14
+ "hidden_size": 768,
15
+ "id2label": {
16
+ "0": "O",
17
+ "1": "B-MISC",
18
+ "2": "I-MISC",
19
+ "3": "B-PER",
20
+ "4": "I-PER",
21
+ "5": "B-ORG",
22
+ "6": "I-ORG",
23
+ "7": "B-LOC",
24
+ "8": "I-LOC"
25
+ },
26
+ "initializer_range": 0.02,
27
+ "input_names": [
28
+ "input_ids",
29
+ "attention_mask",
30
+ "token_type_ids"
31
+ ],
32
+ "intermediate_size": 3072,
33
+ "label2id": {
34
+ "B-LOC": 7,
35
+ "B-MISC": 1,
36
+ "B-ORG": 5,
37
+ "B-PER": 3,
38
+ "I-LOC": 8,
39
+ "I-MISC": 2,
40
+ "I-ORG": 6,
41
+ "I-PER": 4,
42
+ "O": 0
43
+ },
44
+ "layer_norm_eps": 1e-12,
45
+ "max_position_embeddings": 512,
46
+ "model_type": "bert",
47
+ "neuron_batch_size": 1,
48
+ "neuron_sequence_length": 128,
49
+ "num_attention_heads": 12,
50
+ "num_hidden_layers": 12,
51
+ "output_names": [
52
+ "logits"
53
+ ],
54
+ "output_past": true,
55
+ "pad_token_id": 0,
56
+ "position_embedding_type": "absolute",
57
+ "torchscript": true,
58
+ "transformers_version": "4.29.2",
59
+ "type_vocab_size": 2,
60
+ "use_cache": true,
61
+ "vocab_size": 28996
62
+ }
model.neuron ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:213d9250f75b92507ab889df62f663fe19e5dc1822ec1d7a49c8be54370d588d
3
+ size 400559352
special_tokens_map.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": "[CLS]",
3
+ "mask_token": "[MASK]",
4
+ "pad_token": "[PAD]",
5
+ "sep_token": "[SEP]",
6
+ "unk_token": "[UNK]"
7
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "clean_up_tokenization_spaces": true,
3
+ "cls_token": "[CLS]",
4
+ "do_basic_tokenize": true,
5
+ "do_lower_case": false,
6
+ "mask_token": "[MASK]",
7
+ "max_len": 512,
8
+ "model_max_length": 512,
9
+ "never_split": null,
10
+ "pad_token": "[PAD]",
11
+ "sep_token": "[SEP]",
12
+ "strip_accents": null,
13
+ "tokenize_chinese_chars": true,
14
+ "tokenizer_class": "BertTokenizer",
15
+ "unk_token": "[UNK]"
16
+ }
vocab.txt ADDED
The diff for this file is too large to render. See raw diff