|
| 1 | +MNK,runtime,time_mean,time_std |
| 2 | +256,onnx2code-gemm-naive,2.93099801,0.21223372618581754 |
| 3 | +256,onnx2code-loop-tiling,0.6115743366666666,0.06599749912481524 |
| 4 | +256,onnx2code-libxsmm,0.6862000033333334,0.09256254610444041 |
| 5 | +256,tensorflow,0.83879467,0.2111202157956325 |
| 6 | +256,onnxruntime,0.17502199999999998,0.042453192844198025 |
| 7 | +288,onnx2code-gemm-naive,4.013051343333333,0.1922353570042171 |
| 8 | +288,onnx2code-loop-tiling,0.8613543366666666,0.08961090262274632 |
| 9 | +288,onnx2code-libxsmm,0.9549310066666667,0.115530932781052 |
| 10 | +288,tensorflow,0.9110693400000001,0.15713004746802695 |
| 11 | +288,onnxruntime,0.242907,0.06730584212632165 |
| 12 | +320,onnx2code-gemm-naive,5.73331939,0.27483905993038527 |
| 13 | +320,onnx2code-loop-tiling,1.1365396766666667,0.13217515031366067 |
| 14 | +320,onnx2code-libxsmm,1.2718516766666665,0.13979089496648958 |
| 15 | +320,tensorflow,1.1791876766666667,0.20658304444656664 |
| 16 | +320,onnxruntime,0.3266730033333333,0.05591295871724779 |
| 17 | +352,onnx2code-gemm-naive,7.659213810000001,0.31697362694935244 |
| 18 | +352,onnx2code-loop-tiling,1.4359520333333333,0.13807107627317253 |
| 19 | +352,onnx2code-libxsmm,1.7002643733333334,0.19519460629189345 |
| 20 | +352,tensorflow,1.4036383666666665,0.27107338265993375 |
| 21 | +352,onnxruntime,0.4308296766666666,0.09773607186690145 |
| 22 | +384,onnx2code-gemm-naive,11.107058206666666,1.4121811533334494 |
| 23 | +384,onnx2code-loop-tiling,1.8372090099999998,0.20677005859850672 |
| 24 | +384,onnx2code-libxsmm,2.311948676666667,0.25727827390834773 |
| 25 | +384,tensorflow,1.6829836733333334,0.2696682622089221 |
| 26 | +384,onnxruntime,0.538148,0.11062774047528344 |
| 27 | +416,onnx2code-gemm-naive,14.297038139999998,2.729676676434938 |
| 28 | +416,onnx2code-loop-tiling,2.4032359733333326,0.43364645287365833 |
| 29 | +416,onnx2code-libxsmm,2.9514771200000003,0.3241932617549172 |
| 30 | +416,tensorflow,2.00626849,0.322824547564065 |
| 31 | +416,onnxruntime,0.6981953366666667,0.14003255632503223 |
| 32 | +448,onnx2code-gemm-naive,17.374831833333335,0.6144123549041031 |
| 33 | +448,onnx2code-loop-tiling,2.872743363333333,0.2822886150100956 |
| 34 | +448,onnx2code-libxsmm,3.7628733766666667,0.41442373074013844 |
| 35 | +448,tensorflow,2.3588540266666667,0.3072846262026125 |
| 36 | +448,onnxruntime,0.8693563433333332,0.1435663590984048 |
| 37 | +480,onnx2code-gemm-naive,21.50225923,0.7819840128890342 |
| 38 | +480,onnx2code-loop-tiling,3.50825207,0.31527052039920433 |
| 39 | +480,onnx2code-libxsmm,4.428268086666667,0.42702809932715097 |
| 40 | +480,tensorflow,2.62927905,0.3265735363913425 |
| 41 | +480,onnxruntime,1.0414200200000001,0.19804321140402564 |
| 42 | +512,onnx2code-gemm-naive,34.906725013333336,2.4372404714513394 |
| 43 | +512,onnx2code-loop-tiling,4.392616076666666,0.34323584249067596 |
| 44 | +512,onnx2code-libxsmm,6.58534778,0.5006035942198693 |
| 45 | +512,tensorflow,3.917376396666667,0.6595506638626123 |
| 46 | +512,onnxruntime,1.2402080100000001,0.16426971820915917 |
| 47 | +544,onnx2code-gemm-naive,30.517709726666666,1.4655694722498689 |
| 48 | +544,onnx2code-loop-tiling,5.456461906666667,0.47872229454143655 |
| 49 | +544,onnx2code-libxsmm,6.595671356666667,0.6647671986123534 |
| 50 | +544,tensorflow,3.88902766,0.46820230109173716 |
| 51 | +544,onnxruntime,1.482888666666667,0.17757750778619336 |
| 52 | +576,onnx2code-gemm-naive,36.852594706666665,2.328737123134206 |
| 53 | +576,onnx2code-loop-tiling,6.3206076200000005,0.4519496564714359 |
| 54 | +576,onnx2code-libxsmm,7.905415273333334,0.6909014338298326 |
| 55 | +576,tensorflow,4.415751966666667,0.5194307622421865 |
| 56 | +576,onnxruntime,1.73132532,0.1933088669553924 |
| 57 | +608,onnx2code-gemm-naive,42.66949377666666,1.2014143562159671 |
| 58 | +608,onnx2code-loop-tiling,7.304635963333335,0.7251682138322634 |
| 59 | +608,onnx2code-libxsmm,9.214234646666666,0.778034726474529 |
| 60 | +608,tensorflow,5.144455656666667,0.5631055999529266 |
| 61 | +608,onnxruntime,2.047746663333333,0.1852386781655944 |
| 62 | +640,onnx2code-gemm-naive,55.89334453333334,2.273516001627766 |
| 63 | +640,onnx2code-loop-tiling,8.369001973333333,0.5048504896278362 |
| 64 | +640,onnx2code-libxsmm,11.598928710000001,0.9318555946571332 |
| 65 | +640,tensorflow,6.01065204,0.7255272663531527 |
| 66 | +640,onnxruntime,2.3855636833333334,0.2919221096476188 |
| 67 | +672,onnx2code-gemm-naive,58.554538380000004,2.8564249775566233 |
| 68 | +672,onnx2code-loop-tiling,9.613490160000001,0.6311975762601341 |
| 69 | +672,onnx2code-libxsmm,13.277355443333333,1.5214488973740832 |
| 70 | +672,tensorflow,6.44044367,0.6637398145560762 |
| 71 | +672,onnxruntime,2.745889,0.3140661292026463 |
| 72 | +704,onnx2code-gemm-naive,67.34064747000001,2.9076649778401698 |
| 73 | +704,onnx2code-loop-tiling,11.017596743333334,0.6963415985621837 |
| 74 | +704,onnx2code-libxsmm,14.665297196666664,1.2571258474802771 |
| 75 | +704,tensorflow,7.532525746666667,0.8175024675900715 |
| 76 | +704,onnxruntime,3.1209063366666667,0.30571192055678276 |
| 77 | +736,onnx2code-gemm-naive,77.81776146333333,3.994680527831363 |
| 78 | +736,onnx2code-loop-tiling,12.602153343333333,0.7199006589244326 |
| 79 | +736,onnx2code-libxsmm,17.260685663333334,1.3552461221698675 |
| 80 | +736,tensorflow,8.18517155,0.8955714304885909 |
| 81 | +736,onnxruntime,3.4846302700000003,0.29393547805562775 |
| 82 | +768,onnx2code-gemm-naive,114.22778595999999,8.203709334359631 |
| 83 | +768,onnx2code-loop-tiling,14.643412720000002,0.770094425828583 |
| 84 | +768,onnx2code-libxsmm,21.88221372,2.3626316578265025 |
| 85 | +768,tensorflow,9.402519983333335,1.0571307250323347 |
| 86 | +768,onnxruntime,3.9847046133333333,0.35216399742038346 |
| 87 | +800,onnx2code-gemm-naive,102.52447922666666,4.841998191757737 |
| 88 | +800,onnx2code-loop-tiling,16.721700436666666,0.7321350723210706 |
| 89 | +800,onnx2code-libxsmm,22.56168299333333,1.5385892624864095 |
| 90 | +800,tensorflow,10.610878073333334,1.2925829745715158 |
| 91 | +800,onnxruntime,4.526122559999999,0.394388227185878 |
| 92 | +832,onnx2code-gemm-naive,118.56218002333335,3.939953692180838 |
| 93 | +832,onnx2code-loop-tiling,18.922631803333335,1.4425692216179269 |
| 94 | +832,onnx2code-libxsmm,25.1037305,3.1527200230313914 |
| 95 | +832,tensorflow,11.518043606666668,1.147024838134664 |
| 96 | +832,onnxruntime,5.080414686666666,0.47586088191467807 |
| 97 | +864,onnx2code-gemm-naive,130.09689659666668,5.189265473084857 |
| 98 | +864,onnx2code-loop-tiling,20.914084600000002,0.9556391532755657 |
| 99 | +864,onnx2code-libxsmm,29.258843553333328,1.9307758241843858 |
| 100 | +864,tensorflow,13.143729653333333,2.0231548745389447 |
| 101 | +864,onnxruntime,5.760477336666666,1.477134492618634 |
| 102 | +896,onnx2code-gemm-naive,168.89975199666668,5.312927351664043 |
| 103 | +896,onnx2code-loop-tiling,23.185644933333332,1.0045551482742974 |
| 104 | +896,onnx2code-libxsmm,34.172522423333334,1.9982843256822413 |
| 105 | +896,tensorflow,14.184290020000002,1.8862201389964413 |
| 106 | +896,onnxruntime,6.194402336666667,0.5051867525439248 |
| 107 | +928,onnx2code-gemm-naive,165.13455939666667,3.6329771619842033 |
| 108 | +928,onnx2code-loop-tiling,25.830488803333335,1.6850606511951327 |
| 109 | +928,onnx2code-libxsmm,37.66786822666667,3.800566116722251 |
| 110 | +928,tensorflow,15.979504666666665,1.5224369501662662 |
| 111 | +928,onnxruntime,6.822730663333334,0.8137015051617086 |
| 112 | +960,onnx2code-gemm-naive,183.91971043000004,3.7863765477388824 |
| 113 | +960,onnx2code-loop-tiling,27.901448323333334,1.140211974885468 |
| 114 | +960,onnx2code-libxsmm,40.32194981999999,4.608950302465135 |
| 115 | +960,tensorflow,17.55200400333333,3.1222178969760126 |
| 116 | +960,onnxruntime,7.582337316666665,1.3798306560698488 |
| 117 | +992,onnx2code-gemm-naive,202.18115277666666,4.9461951688977575 |
| 118 | +992,onnx2code-loop-tiling,30.831881576666667,1.2410191207267294 |
| 119 | +992,onnx2code-libxsmm,46.472281063333334,3.5206640553037913 |
| 120 | +992,tensorflow,19.609973956666668,1.9594430432812078 |
| 121 | +992,onnxruntime,8.354810469999999,1.224331820426381 |
| 122 | +1024,onnx2code-gemm-naive,311.7934103333333,6.877924793102408 |
| 123 | +1024,onnx2code-loop-tiling,34.00422953666667,1.65053201542282 |
| 124 | +1024,onnx2code-libxsmm,56.044168510000006,4.313170511153236 |
| 125 | +1024,tensorflow,21.53622228,3.0112313016520313 |
| 126 | +1024,onnxruntime,9.185121386666667,1.5104097708390252 |
| 127 | +1056,onnx2code-gemm-naive,254.14210583000002,6.641041915904256 |
| 128 | +1056,onnx2code-loop-tiling,38.359650099999996,1.305478721310599 |
| 129 | +1056,onnx2code-libxsmm,59.21067334000001,4.997676490874754 |
| 130 | +1056,tensorflow,22.382056223333333,2.0500099528156066 |
| 131 | +1056,onnxruntime,9.777039993333332,0.7107724979235902 |
| 132 | +1088,onnx2code-gemm-naive,292.2926318666667,9.702008574620628 |
| 133 | +1088,onnx2code-loop-tiling,42.027352369999996,1.749770538149051 |
| 134 | +1088,onnx2code-libxsmm,67.41834954333333,4.8664865627514065 |
| 135 | +1088,tensorflow,26.594176163333334,2.0905433452247073 |
| 136 | +1088,onnxruntime,10.497412073333331,0.8809854735765934 |
| 137 | +1120,onnx2code-gemm-naive,338.5233844933333,10.164223333108087 |
| 138 | +1120,onnx2code-loop-tiling,45.16896703,2.3841331282466762 |
| 139 | +1120,onnx2code-libxsmm,76.79927917333333,5.7278331098052515 |
| 140 | +1120,tensorflow,28.83353773333333,2.563366119458253 |
| 141 | +1120,onnxruntime,11.659171516666666,1.8744377435576556 |
| 142 | +1152,onnx2code-gemm-naive,403.66976146333326,9.52804313250809 |
| 143 | +1152,onnx2code-loop-tiling,49.305075323333334,3.73440690467644 |
| 144 | +1152,onnx2code-libxsmm,86.43004374333333,6.511510521143248 |
| 145 | +1152,tensorflow,30.32093784666667,2.2242678975026324 |
| 146 | +1152,onnxruntime,12.255513253333332,0.9498209524135391 |
| 147 | +1184,onnx2code-gemm-naive,416.8149896066667,16.73399445325064 |
| 148 | +1184,onnx2code-loop-tiling,53.818254503333335,4.412354834290176 |
| 149 | +1184,onnx2code-libxsmm,95.98643558,6.660626441719355 |
| 150 | +1184,tensorflow,32.997734083333334,3.954762346023894 |
| 151 | +1184,onnxruntime,13.61072438,0.9931182019533201 |
| 152 | +1216,onnx2code-gemm-naive,449.9982161666666,11.71757127478388 |
| 153 | +1216,onnx2code-loop-tiling,57.79504892,3.78510541217508 |
| 154 | +1216,onnx2code-libxsmm,113.02410599,6.211236515543298 |
| 155 | +1216,tensorflow,33.57050304333334,3.4069599306920897 |
| 156 | +1216,onnxruntime,14.462370676666664,1.1351487701683944 |
| 157 | +1248,onnx2code-gemm-naive,533.9181180966667,19.01682602485039 |
| 158 | +1248,onnx2code-loop-tiling,61.468259516666656,2.3679392876943126 |
| 159 | +1248,onnx2code-libxsmm,128.34663120999997,6.3470097444951215 |
| 160 | +1248,tensorflow,36.713297913333335,2.8748869668129955 |
| 161 | +1248,onnxruntime,15.35723634,1.0219832136925788 |
0 commit comments