upload model

Browse files

Files changed (8) hide show

.gitattributes +1 -0
all_metrics.csv +102 -0
config.json +40 -0
model.neuron +3 -0
special_tokens_map.json +7 -0
tokenizer.json +0 -0
tokenizer_config.json +15 -0
vocab.txt +0 -0

.gitattributes CHANGED Viewed

@@ -32,3 +32,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+model.neuron filter=lfs diff=lfs merge=lfs -text

all_metrics.csv ADDED Viewed

	@@ -0,0 +1,102 @@

+timestamp,run_id,name,subgraph,scope,sub_scope,value,unit,
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,CanonicalizeIR,0.0093994140625,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,ExpandBatchNorm,0.009254693984985352,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,ResolveComplicatePredicates,0.0071446895599365234,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,AffinePredicateResolution,0.008615255355834961,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,EliminateDivs,0.00906991958618164,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,TensorOpFusion,0.009348154067993164,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,TensorOpTransform,0.034893035888671875,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,LowerTensorOp,0.011458396911621094,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,MemcpyElimination,0.8764715194702148,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,DeadStoreElimination,0.6812219619750977,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,SimplifySlice,0.0030181407928466797,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,PadElimination,0.0003688335418701172,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,LoopFusion,0.37325453758239746,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,ValueNumbering,0.0283353328704834,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,TCTransform,0.017099857330322266,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,CommuteConcat,0.010370254516601562,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,RecognizeOpIdiom,0.015559911727905273,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,MaskPropagation,0.011378765106201172,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,Recompute,0.0005948543548583984,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,DoNothing,9.083747863769531e-05,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,MutateDataType,0.0023496150970458984,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,AutoCastTCInputs,0.003918647766113281,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,GenericAccessSimplifier,0.01243281364440918,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,Simplifier,0.41060328483581543,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,Delinearization,0.03841114044189453,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,DelinearIndices,0.015451431274414062,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,DeadCodeElimination,0.007534027099609375,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,LegalizeCCOpLayout,0.003658771514892578,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,InferIntrinsicOnCC,0.050520896911621094,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,ResolveAccessConflict,0.02746438980102539,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,LocalLayoutOpt,0.023167848587036133,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,GlobalLayoutOpt,0.3492927551269531,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,CanonicalizeDAG,0.007649421691894531,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,FlattenAxesForTiling,0.008371829986572266,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,SundaSizeTiling,0.44942784309387207,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,InferTongaTensor,0.1616523265838623,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,RewriteReplicationMatmul,0.007273435592651367,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,DataLocalityOpt,1.1143321990966797,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,TilingProfiler,0.009297370910644531,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,LegalizeSundaMacro,0.022243261337280273,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,PerfectLoopNest,0.016142606735229492,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,RewriteWeights,0.23421001434326172,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,ReshapeWeights,0.004595518112182617,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,FlattenMacroLoop,0.06238913536071777,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,SimplifyPredicates,0.22608160972595215,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,InferInitValue,0.7848811149597168,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,TongaSimplifier,0.06940984725952148,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,SimplifyTensor,0.03229641914367676,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,LICM,0.10033583641052246,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,SundaISel,0.19430756568908691,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,TongaLoopFusion,0.08935689926147461,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,FactorizeBlkDims,0.03960418701171875,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,TongaValueNumbering,0.02214527130126953,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,TongaInstComb,0.2443535327911377,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,VectorizeMatMult,0.002829313278198242,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,VectorizeDMA,0.017197132110595703,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,LegalizePartitionReduce,0.0033822059631347656,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,PartialLoopFusion,0.08432555198669434,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,LowerTranspose,0.037595510482788086,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,LateTongaInstComb,0.16178202629089355,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,LowerTongaBatchId,0.002024412155151367,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,SplitAccGrp,0.003551006317138672,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,SpillPSum,0.034529685974121094,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,TongaLICM,0.03946352005004883,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,InferPSumTensor,0.09653544425964355,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,WeightCoalescing,0.014181375503540039,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,LowerIntrinsics,0.0035042762756347656,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,LegalizeSundaAccess,0.02397894859313965,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,TongaAffineLoopXform,0.013040304183959961,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,VectorizeAllReduce,0.003997087478637695,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,RelaxPredicates,0.007230043411254883,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,TensorInitialization,0.00619816780090332,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,TongaSimplifyPredicates,0.012606382369995117,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,ExpandISAMacro,0.005366325378417969,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,LegalizeType,0.009764671325683594,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,SimplifyTongaTensor,0.011408090591430664,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,DMALocalityOpt,0.0025980472564697266,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,DataStreaming,0.009914875030517578,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,PSUMModuloAlloc,0.2481861114501953,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,LegalizeStreamShuffle,0.004734516143798828,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,CoalesceCCOp,0.003985881805419922,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,SimpleAllReduceTiling,0.004281520843505859,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,StaticProfiler,0.015914201736450195,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,SplitAPUnionSets,0.05818510055541992,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,SundaLowerGenericAccess,0.0043087005615234375,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,DumpGraphAndMetadata,0.011687755584716797,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg0000,Tensorizer,BirCodeGenLoop,0.11950278282165527,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,root,Tensorizer,All,9.188081979751587,Seconds
+,all-MiniLM-L6-v2-neuronx,TPBCount,None,KELP,None,1,Count
+,all-MiniLM-L6-v2-neuronx,CompilationTime,root,Frontend,0,9.660834789276123,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,all,Frontend,0,9.664303064346313,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg00,HHChecker,0,1.2636184692382812e-05,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,all,HHChecker,0,0.003728151321411133,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,sg00,WalrusDriver,0,0.3347148895263672,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,all,WalrusDriver,0,0.34115004539489746,Seconds
+,all-MiniLM-L6-v2-neuronx,EstimatedLowerBoundLatency,None,KELP,None,0,Milliseconds
+,all-MiniLM-L6-v2-neuronx,EstimatedUpperBoundThroughput,None,KELP,None,0,Count/Second
+,all-MiniLM-L6-v2-neuronx,InferentiaDRAMUsage,None,KELP,None,0,Bytes
+,all-MiniLM-L6-v2-neuronx,CompilationTime,all,Kelper,0,3.2928266525268555,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,root,Pipeline,0,13.31865906715393,Seconds
+,all-MiniLM-L6-v2-neuronx,CompilationTime,all,production_total,None,13.302007913589478,Seconds

config.json ADDED Viewed

	@@ -0,0 +1,40 @@

+{
+  "_name_or_path": "sentence-transformers/all-MiniLM-L6-v2",
+  "architectures": [
+    "BertModel"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "auto_cast": null,
+  "auto_cast_type": null,
+  "classifier_dropout": null,
+  "dynamic_batch_size": true,
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 384,
+  "initializer_range": 0.02,
+  "input_names": [
+    "input_ids",
+    "attention_mask",
+    "token_type_ids"
+  ],
+  "intermediate_size": 1536,
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "neuron_batch_size": 1,
+  "neuron_sequence_length": 128,
+  "num_attention_heads": 12,
+  "num_hidden_layers": 6,
+  "output_names": [
+    "last_hidden_state",
+    "pooler_output"
+  ],
+  "pad_token_id": 0,
+  "position_embedding_type": "absolute",
+  "torchscript": true,
+  "transformers_version": "4.29.2",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 30522
+}

model.neuron ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3594009167a9f92e05f76b8415348a850b2d6427a340867ba840a9ebc0a4bbdb
+size 83573752

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,15 @@

+{
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_basic_tokenize": true,
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "never_split": null,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "BertTokenizer",
+  "unk_token": "[UNK]"
+}

vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff