File size: 10,955 Bytes
f55088b
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
timestamp,run_id,name,subgraph,scope,sub_scope,value,unit,
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,CanonicalizeIR,0.01797008514404297,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,ExpandBatchNorm,0.0183563232421875,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,ResolveComplicatePredicates,0.014789581298828125,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,AffinePredicateResolution,0.01681208610534668,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,EliminateDivs,0.016480684280395508,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,TensorOpFusion,0.019669055938720703,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,TensorOpTransform,0.08614420890808105,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,LowerTensorOp,0.024866819381713867,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,MemcpyElimination,2.362525463104248,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,DeadStoreElimination,1.66868257522583,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,SimplifySlice,0.005608797073364258,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,PadElimination,0.0008716583251953125,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,LoopFusion,1.1253650188446045,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,ValueNumbering,0.06372833251953125,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,TCTransform,0.03502392768859863,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,CommuteConcat,0.02022075653076172,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,RecognizeOpIdiom,0.030136585235595703,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,MaskPropagation,0.021459341049194336,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,Recompute,0.0011527538299560547,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,DoNothing,9.822845458984375e-05,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,MutateDataType,0.0048444271087646484,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,AutoCastTCInputs,0.00899815559387207,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,GenericAccessSimplifier,0.026137351989746094,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,Simplifier,0.9230337142944336,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,Delinearization,0.09181427955627441,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,DelinearIndices,0.03810691833496094,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,DeadCodeElimination,0.012696504592895508,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,LegalizeCCOpLayout,0.00601959228515625,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,InferIntrinsicOnCC,0.11776328086853027,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,ResolveAccessConflict,0.056751251220703125,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,LocalLayoutOpt,0.05041003227233887,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,GlobalLayoutOpt,1.0678589344024658,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,CanonicalizeDAG,0.014478206634521484,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,FlattenAxesForTiling,0.01801443099975586,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,SundaSizeTiling,1.157806396484375,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,InferTongaTensor,0.4169459342956543,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,RewriteReplicationMatmul,0.013886213302612305,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,DataLocalityOpt,2.7979495525360107,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,TilingProfiler,0.017884492874145508,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,LegalizeSundaMacro,0.046257734298706055,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,PerfectLoopNest,0.030710935592651367,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,RewriteWeights,1.030827283859253,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,ReshapeWeights,0.008022785186767578,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,FlattenMacroLoop,0.23689508438110352,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,SimplifyPredicates,0.49019598960876465,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,InferInitValue,1.756650686264038,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,TongaSimplifier,0.1537785530090332,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,SimplifyTensor,0.06964278221130371,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,LICM,0.20774054527282715,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,SundaISel,0.49762630462646484,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,TongaLoopFusion,0.3184328079223633,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,FactorizeBlkDims,0.13978266716003418,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,TongaValueNumbering,0.05675053596496582,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,TongaInstComb,0.22873902320861816,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,VectorizeMatMult,0.005601167678833008,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,VectorizeDMA,0.036812543869018555,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,LegalizePartitionReduce,0.008343219757080078,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,PartialLoopFusion,0.3734281063079834,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,LowerTranspose,0.08829855918884277,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,LateTongaInstComb,0.25022029876708984,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,LowerTongaBatchId,0.005396127700805664,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,SplitAccGrp,0.008783102035522461,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,SpillPSum,0.0793917179107666,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,TongaLICM,0.09383869171142578,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,InferPSumTensor,0.1435384750366211,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,WeightCoalescing,0.032679080963134766,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,LowerIntrinsics,0.007474660873413086,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,LegalizeSundaAccess,0.05263018608093262,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,TongaAffineLoopXform,0.026118993759155273,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,VectorizeAllReduce,0.00763702392578125,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,RelaxPredicates,0.01361393928527832,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,TensorInitialization,0.007319927215576172,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,TongaSimplifyPredicates,0.02505016326904297,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,ExpandISAMacro,0.08680844306945801,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,LegalizeType,0.023194313049316406,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,SimplifyTongaTensor,0.03235292434692383,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,DMALocalityOpt,0.006356239318847656,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,DataStreaming,0.027247190475463867,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,PSUMModuloAlloc,0.6701242923736572,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,LegalizeStreamShuffle,0.008973360061645508,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,CoalesceCCOp,0.009181499481201172,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,SimpleAllReduceTiling,0.008774042129516602,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,StaticProfiler,0.03323554992675781,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,SplitAPUnionSets,0.12185835838317871,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,SundaLowerGenericAccess,0.01173710823059082,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,DumpGraphAndMetadata,0.02282428741455078,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg0000,Tensorizer,BirCodeGenLoop,0.32172155380249023,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,root,Tensorizer,All,22.195425987243652,Seconds
,bert-base-uncased_SWAG-neuronx,TPBCount,None,KELP,None,1,Count
,bert-base-uncased_SWAG-neuronx,CompilationTime,root,Frontend,0,23.157591104507446,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,all,Frontend,0,23.16165280342102,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg00,HHChecker,0,1.2636184692382812e-05,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,all,HHChecker,0,0.003998756408691406,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,sg00,WalrusDriver,0,1.8855173587799072,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,all,WalrusDriver,0,1.892042875289917,Seconds
,bert-base-uncased_SWAG-neuronx,EstimatedLowerBoundLatency,None,KELP,None,0,Milliseconds
,bert-base-uncased_SWAG-neuronx,EstimatedUpperBoundThroughput,None,KELP,None,0,Count/Second
,bert-base-uncased_SWAG-neuronx,InferentiaDRAMUsage,None,KELP,None,0,Bytes
,bert-base-uncased_SWAG-neuronx,CompilationTime,all,Kelper,0,4.728264331817627,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,root,Pipeline,0,29.805726766586304,Seconds
,bert-base-uncased_SWAG-neuronx,CompilationTime,all,production_total,None,29.785958766937256,Seconds