Advertisement
Guest User

Untitled

a guest
Sep 20th, 2019
118
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 59.79 KB | None | 0 0
  1. # Runtime Features
  2. 0. BLAS_APPLE : ✖ BLAS_APPLE
  3. 0. BLAS_ATLAS : ✖ BLAS_ATLAS
  4. 0. BLAS_MKL : ✖ BLAS_MKL
  5. 0. BLAS_OPEN : ✔ BLAS_OPEN
  6. 0. CAFFE : ✖ CAFFE
  7. 0. CPU_AVX : ✔ CPU_AVX
  8. 0. CPU_AVX2 : ✖ CPU_AVX2
  9. 0. CPU_SSE : ✔ CPU_SSE
  10. 0. CPU_SSE2 : ✔ CPU_SSE2
  11. 0. CPU_SSE3 : ✔ CPU_SSE3
  12. 0. CPU_SSE4A : ✖ CPU_SSE4A
  13. 0. CPU_SSE4_1 : ✔ CPU_SSE4_1
  14. 0. CPU_SSE4_2 : ✔ CPU_SSE4_2
  15. 0. CUDA : ✖ CUDA
  16. 0. CUDA_RTC : ✖ CUDA_RTC
  17. 0. CUDNN : ✖ CUDNN
  18. 0. CXX14 : ✖ CXX14
  19. 0. DEBUG : ✖ DEBUG
  20. 0. DIST_KVSTORE : ✖ DIST_KVSTORE
  21. 0. F16C : ✔ F16C
  22. 0. INT64_TENSOR_SIZE : ✖ INT64_TENSOR_SIZE
  23. 0. JEMALLOC : ✖ JEMALLOC
  24. 0. LAPACK : ✔ LAPACK
  25. 0. MKLDNN : ✖ MKLDNN
  26. 0. NCCL : ✖ NCCL
  27. 0. OPENCV : ✖ OPENCV
  28. 0. OPENMP : ✔ OPENMP
  29. 0. PROFILER : ✖ PROFILER
  30. 0. SIGNAL_HANDLER : ✖ SIGNAL_HANDLER
  31. 0. SSE : ✖ SSE
  32. 0. TENSORRT : ✖ TENSORRT
  33. 0. TVM_OP : ✖ TVM_OP
  34. # Benchmark Results
  35. | Operator | Avg Time (ms) | P50 Time (ms) | P90 Time (ms) | P99 Time (ms) | Inputs |
  36. | :---: | :---: | :---: | :---: | :---: | :---: |
  37. | BatchNorm | 18.313633010839112 | 18.30739449360408 | 18.39710977510549 | 18.591279740212496 | {'data': (32, 3, 256, 256), 'gamma': (3,), 'beta': (3,), 'moving_mean': (3,), 'moving_var': (3,)} |
  38. | BatchNorm | 37.95068456791341 | 38.154728506924585 | 38.21642779512331 | 38.2942253665533 | {'data': (32, 3, 10000, 10), 'gamma': (3,), 'beta': (3,), 'moving_mean': (3,), 'moving_var': (3,)} |
  39. | BlockGrad | 1.4952558028744534 | 1.4942825073376298 | 1.5214132494293153 | 1.535775777883828 | {'data': (1024, 1024)} |
  40. | BlockGrad | 0.03530186717398465 | 0.034639990190044045 | 0.03528897650539876 | 0.04986266372725375 | {'data': (10000, 1)} |
  41. | BlockGrad | 1.4428811921970919 | 1.4465769927483052 | 1.5089457214344293 | 1.518197794794105 | {'data': (10000, 100)} |
  42. | Convolution | 6.226346398470923 | 6.2347049824893475 | 6.253477482823655 | 6.266250924672931 | {'data': (32, 3, 256), 'weight': (64, 3, 3), 'bias': (64,), 'kernel': (3,), 'stride': (1,), 'dilate': (1,), 'pad': (0,), 'num_filter': 64, 'layout': 'NCW'} |
  43. | Deconvolution | 7.434120944235474 | 7.432792510371655 | 7.512046629562974 | 7.56524161726702 | {'data': (32, 3, 256), 'weight': (3, 64, 3), 'bias': (64,), 'kernel': (3,), 'stride': (1,), 'dilate': (1,), 'pad': (0,), 'adj': (0,), 'num_filter': 64, 'no_bias': False, 'layout': 'NCW'} |
  44. | Dropout | 8.825434681493789 | 9.538002515910193 | 9.669515170389786 | 9.711648562224582 | {'data': (32, 3, 256, 256), 'p': 0.5, 'mode': 'always'} |
  45. | Dropout | 0.29045442992355675 | 0.2849095035344362 | 0.29633100493811076 | 0.3439964714925752 | {'data': (10000, 10), 'p': 0.5, 'mode': 'always'} |
  46. | FullyConnected | 104.99763897212688 | 105.00158902141266 | 105.27298070373945 | 105.51776159729343 | {'data': (32, 3, 256, 256), 'num_hidden': 64, 'weight': (64, 196608), 'bias': (64,), 'flatten': True} |
  47. | FullyConnected | 46.593356058583595 | 46.455940522719175 | 47.0770200015977 | 48.33531428361317 | {'data': (32, 3, 256, 256), 'num_hidden': 64, 'weight': (64, 256), 'bias': (64,), 'flatten': False} |
  48. | LeakyReLU | 0.3115620563039556 | 0.3099369932897389 | 0.32007485278882086 | 0.3278291027527304 | {'data': (1024, 1024), 'act_type': 'leaky', 'slope': 0.1} |
  49. | LeakyReLU | 0.20442567067220807 | 0.20300049800425768 | 0.20749933901242912 | 0.23426922911312437 | {'data': (10000, 1), 'act_type': 'leaky', 'slope': 0.1} |
  50. | LeakyReLU | 0.2993507409701124 | 0.2967409964185208 | 0.3051422943826765 | 0.3744153521256523 | {'data': (10000, 100), 'act_type': 'leaky', 'slope': 0.1} |
  51. | LeakyReLU | 1.6231002827407792 | 1.6249394975602627 | 1.6522664984222502 | 1.700355393695645 | {'data': (1024, 1024), 'act_type': 'elu', 'slope': 0.1} |
  52. | LeakyReLU | 0.23089678026735783 | 0.22918797913007438 | 0.23673013201914728 | 0.24977984197903444 | {'data': (10000, 1), 'act_type': 'elu', 'slope': 0.1} |
  53. | LeakyReLU | 0.6168936082394794 | 0.6134965224191546 | 0.6252045044675469 | 0.6760416034376251 | {'data': (10000, 100), 'act_type': 'elu', 'slope': 0.1} |
  54. | LeakyReLU | 1.6051644057733938 | 1.6120535146910697 | 1.6396583057940006 | 1.666092865052633 | {'data': (1024, 1024), 'act_type': 'selu'} |
  55. | LeakyReLU | 0.22496317222248763 | 0.22314550005830824 | 0.2321725187357515 | 0.24429241893813028 | {'data': (10000, 1), 'act_type': 'selu'} |
  56. | LeakyReLU | 0.6097522203344852 | 0.6072960095480084 | 0.620476488256827 | 0.6360733701149003 | {'data': (10000, 100), 'act_type': 'selu'} |
  57. | LeakyReLU | 3.2636905781691894 | 3.28320698463358 | 3.326876839855686 | 3.3614499925170094 | {'data': (1024, 1024), 'act_type': 'prelu', 'gamma': (1, 1024)} |
  58. | LeakyReLU | 0.3463137795915827 | 0.3441014850977808 | 0.35500116646289825 | 0.3663692984264345 | {'data': (10000, 1), 'act_type': 'prelu', 'gamma': (1, 1)} |
  59. | LeakyReLU | 2.8227887477260083 | 2.813424012856558 | 2.910937712294981 | 2.9731572733726352 | {'data': (10000, 100), 'act_type': 'prelu', 'gamma': (1, 100)} |
  60. | Pooling | 0.44675390468910336 | 0.44523098040372133 | 0.45442780246958137 | 0.4623096209252253 | {'data': (32, 3, 256), 'kernel': 3, 'pool_type': 'avg', 'global_pool': 0, 'stride': 1, 'pad': 1} |
  61. | abs | 0.30018259189091623 | 0.27917601983062923 | 0.2915823191870004 | 0.9413014142774078 | {'data': (1024, 1024)} |
  62. | abs | 0.13609811896458268 | 0.13382500037550926 | 0.14182921731844547 | 0.1720652612857522 | {'data': (10000, 1)} |
  63. | abs | 0.29367450275458395 | 0.2732864813879132 | 0.2824523311574012 | 0.8990391832776402 | {'data': (10000, 100)} |
  64. | adam_update | 0.34745052515063435 | 0.3448499774094671 | 0.35662600421346724 | 0.37285631056875 | {'weight': (1024, 1024), 'grad': (1024, 1024), 'mean': (1024, 1024), 'var': (1024, 1024), 'lr': 0.1, 'beta1': 0.1, 'beta2': 0.1, 'epsilon': 1e-08, 'rescale_grad': 0.4, 'lazy_update': 0} |
  65. | adam_update | 0.09181945293676108 | 0.08076502126641572 | 0.08445210987702012 | 0.5322693608468406 | {'weight': (10000, 1), 'grad': (10000, 1), 'mean': (10000, 1), 'var': (10000, 1), 'lr': 0.5, 'beta1': 0.5, 'beta2': 0.5, 'epsilon': 1e-08, 'rescale_grad': 0.4, 'lazy_update': 0} |
  66. | adam_update | 0.4338180704507977 | 0.3794344956986606 | 0.6274563784245403 | 0.7292997551849112 | {'weight': (10000, 100), 'grad': (10000, 100), 'mean': (10000, 100), 'var': (10000, 100), 'lr': 0.9, 'beta1': 0.9, 'beta2': 0.9, 'epsilon': 1e-08, 'rescale_grad': 0.4, 'lazy_update': 0} |
  67. | arccos | 1.0153253615135327 | 0.9993000130634755 | 1.009789714589715 | 1.6450840962352236 | {'data': (1024, 1024)} |
  68. | arccos | 0.18725544679909945 | 0.18566250219009817 | 0.19209347665309906 | 0.21889669937081652 | {'data': (10000, 1)} |
  69. | arccos | 0.9705644194036722 | 0.954272982198745 | 0.9670434810686857 | 1.5226267662365 | {'data': (10000, 100)} |
  70. | arccosh | 1.0428956151008606 | 1.026564510539174 | 1.0395188117399812 | 1.6523843735922132 | {'data': (1024, 1024)} |
  71. | arccosh | 0.1761078689014539 | 0.17519501852802932 | 0.17900621751323342 | 0.19536456791684034 | {'data': (10000, 1)} |
  72. | arccosh | 0.9962721302872524 | 0.9802384884096682 | 0.9912115638144314 | 1.614464087761008 | {'data': (10000, 100)} |
  73. | arcsin | 1.1356739659095183 | 0.9827050089370459 | 1.0459705721586943 | 5.198463420965733 | {'data': (1024, 1024)} |
  74. | arcsin | 0.21745430422015488 | 0.19695900846272707 | 0.20400768844410777 | 0.4209688515402451 | {'data': (10000, 1)} |
  75. | arcsin | 0.952649338869378 | 0.9363345161546022 | 0.9473574231378734 | 1.5808601735625425 | {'data': (10000, 100)} |
  76. | arcsinh | 1.4123814512277022 | 1.394841994624585 | 1.408784999512136 | 2.032203279086389 | {'data': (1024, 1024)} |
  77. | arcsinh | 0.15720238792710006 | 0.15579251339659095 | 0.1597996917553246 | 0.1764877280220391 | {'data': (10000, 1)} |
  78. | arcsinh | 1.35093764110934 | 1.336168497800827 | 1.3449881866108626 | 2.016429853974842 | {'data': (10000, 100)} |
  79. | arctan | 0.7451857253909111 | 0.7255024975165725 | 0.7552001858130097 | 1.3706932071363556 | {'data': (1024, 1024)} |
  80. | arctan | 0.12353285623248667 | 0.12086352217011154 | 0.1252405229024589 | 0.15026176348328668 | {'data': (10000, 1)} |
  81. | arctan | 0.7261816784739494 | 0.7166980067268014 | 0.7410447346046567 | 1.3806071970611815 | {'data': (10000, 100)} |
  82. | arctanh | 1.0189429036108777 | 0.9988179954234511 | 1.025452493922785 | 1.6245333245024092 | {'data': (1024, 1024)} |
  83. | arctanh | 0.12189498054794967 | 0.11981799616478384 | 0.12328621232882142 | 0.1469759503379469 | {'data': (10000, 1)} |
  84. | arctanh | 0.9916196181438863 | 0.9736335196066648 | 0.9997191024012864 | 1.6630542866187175 | {'data': (10000, 100)} |
  85. | argmax | 9.495754671515897 | 7.56606349023059 | 12.150796095374972 | 12.481605882639997 | {'data': (1024, 1024), 'axis': 0} |
  86. | argmax | 0.08755001123063266 | 0.08664902998134494 | 0.08848840952850878 | 0.10592885024379953 | {'data': (10000, 1), 'axis': 0} |
  87. | argmax | 4.774968061828986 | 4.765146994031966 | 4.779584420612082 | 5.148953440948395 | {'data': (10000, 100), 'axis': 0} |
  88. | argmax_channel | 0.252590870950371 | 0.2513630024623126 | 0.25661211111582816 | 0.26856422307901084 | {'data': (1024, 1024)} |
  89. | argmax_channel | 0.05253606825135648 | 0.05133703234605491 | 0.053086911793798215 | 0.09328770625870679 | {'data': (10000, 1)} |
  90. | argmax_channel | 0.2631993911927566 | 0.2618970174808055 | 0.2701087505556643 | 0.27509026927873503 | {'data': (10000, 100)} |
  91. | argmin | 8.344157298561186 | 7.553609524620697 | 12.345996918156743 | 12.395493421354331 | {'data': (1024, 1024), 'axis': 0} |
  92. | argmin | 0.08724255952984095 | 0.08638147846795619 | 0.08762689540162683 | 0.10443798848427846 | {'data': (10000, 1), 'axis': 0} |
  93. | argmin | 4.779016597894952 | 4.774890490807593 | 4.785594117129222 | 5.0593120278790655 | {'data': (10000, 100), 'axis': 0} |
  94. | argsort | 20.727770794765092 | 20.494411495747045 | 20.609241392230615 | 26.542324459878728 | {'data': (1024, 1024), 'axis': 0} |
  95. | argsort | 0.8498476014938205 | 0.8472595072817057 | 0.8598424377851188 | 0.8696252229856328 | {'data': (10000, 1), 'axis': 0} |
  96. | argsort | 16.487408822285943 | 16.438968013972044 | 16.45129984826781 | 17.77653526281939 | {'data': (10000, 100), 'axis': 0} |
  97. | batch_dot | 3324.3811008310877 | 2264.345121977385 | 7083.653557801154 | 8983.74359956128 | {'lhs': (32, 1024, 1024), 'rhs': (32, 1024, 1024)} |
  98. | batch_dot | 2036.5331345563754 | 2052.3844420094974 | 2062.600179592846 | 2078.7908131227596 | {'lhs': (32, 1000, 10), 'rhs': (32, 1000, 10), 'transpose_b': True} |
  99. | batch_dot | 7.841857359744608 | 7.412014005240053 | 8.558496972545981 | 15.771587187773559 | {'lhs': (32, 1000, 1), 'rhs': (32, 100, 1000), 'transpose_a': True, 'transpose_b': True} |
  100. | broadcast_add | 0.24796352081466466 | 0.22486550733447075 | 0.2429456973914057 | 0.8810479420935773 | {'lhs': (1024, 1024), 'rhs': (1024, 1024)} |
  101. | broadcast_add | 0.25736386014614254 | 0.25490749976597726 | 0.263956340495497 | 0.2974446828011428 | {'lhs': (10000, 10), 'rhs': (10000, 10)} |
  102. | broadcast_add | 0.15241757268086076 | 0.15058901044540107 | 0.15816755476407707 | 0.1753999874927106 | {'lhs': (10000, 1), 'rhs': (10000, 1)} |
  103. | broadcast_div | 0.2765837428160012 | 0.2574165118858218 | 0.26501420652493834 | 0.8891873760148913 | {'lhs': (1024, 1024), 'rhs': (1024, 1024)} |
  104. | broadcast_div | 0.18847630301024765 | 0.18613351858220994 | 0.19565682159736753 | 0.22302395256701876 | {'lhs': (10000, 10), 'rhs': (10000, 10)} |
  105. | broadcast_div | 0.16752495255786926 | 0.16540152137167752 | 0.173196621472016 | 0.1919684937456625 | {'lhs': (10000, 1), 'rhs': (10000, 1)} |
  106. | broadcast_equal | 0.0693412497639656 | 0.06766198202967644 | 0.07100407383404672 | 0.11357285955455161 | {'lhs': (1024, 1024), 'rhs': (1024, 1024)} |
  107. | broadcast_equal | 0.060607611667364836 | 0.059619516832754016 | 0.06351948250085115 | 0.07424216601066301 | {'lhs': (10000, 10), 'rhs': (10000, 10)} |
  108. | broadcast_equal | 0.05071879597380757 | 0.0501224712934345 | 0.05090097547508776 | 0.06048237788490956 | {'lhs': (10000, 1), 'rhs': (10000, 1)} |
  109. | broadcast_greater | 0.06739519536495209 | 0.06557852611877024 | 0.07295301766134799 | 0.09667362086474901 | {'lhs': (1024, 1024), 'rhs': (1024, 1024)} |
  110. | broadcast_greater | 0.06123604194726795 | 0.060006510466337204 | 0.06383220897987488 | 0.08227484009694314 | {'lhs': (10000, 10), 'rhs': (10000, 10)} |
  111. | broadcast_greater | 0.05048446997534484 | 0.04991897731088102 | 0.05063812714070082 | 0.06735570379532874 | {'lhs': (10000, 1), 'rhs': (10000, 1)} |
  112. | broadcast_greater_equal | 0.06858992914203554 | 0.06698849028907716 | 0.07412192644551398 | 0.08456468232907356 | {'lhs': (1024, 1024), 'rhs': (1024, 1024)} |
  113. | broadcast_greater_equal | 0.0612393394112587 | 0.06045849295333028 | 0.06368086906149983 | 0.08857056964188816 | {'lhs': (10000, 10), 'rhs': (10000, 10)} |
  114. | broadcast_greater_equal | 0.050851337728090584 | 0.05018000956624746 | 0.05079847760498524 | 0.06891493510920563 | {'lhs': (10000, 1), 'rhs': (10000, 1)} |
  115. | broadcast_hypot | 0.9863157814834267 | 0.965763523709029 | 0.9842249855864793 | 1.6215943230781726 | {'lhs': (1024, 1024), 'rhs': (1024, 1024)} |
  116. | broadcast_hypot | 0.23089523136150092 | 0.22963748779147863 | 0.23892831522971392 | 0.24974003667011874 | {'lhs': (10000, 10), 'rhs': (10000, 10)} |
  117. | broadcast_hypot | 0.4068673017900437 | 0.43578448821790516 | 0.4510889935772866 | 0.4696108686039229 | {'lhs': (10000, 1), 'rhs': (10000, 1)} |
  118. | broadcast_lesser | 0.07531550945714116 | 0.07341147284023464 | 0.08006297866813838 | 0.10534552216995516 | {'lhs': (1024, 1024), 'rhs': (1024, 1024)} |
  119. | broadcast_lesser | 0.05309912608936429 | 0.05234152195043862 | 0.054681708570569754 | 0.0766715069767089 | {'lhs': (10000, 10), 'rhs': (10000, 10)} |
  120. | broadcast_lesser | 0.04132356203626841 | 0.0404869788326323 | 0.04146838327869773 | 0.05544367129914471 | {'lhs': (10000, 1), 'rhs': (10000, 1)} |
  121. | broadcast_lesser_equal | 0.06480687123257667 | 0.06376649253070354 | 0.06701863603666425 | 0.0885962793836371 | {'lhs': (1024, 1024), 'rhs': (1024, 1024)} |
  122. | broadcast_lesser_equal | 0.05871665256563574 | 0.05764549132436514 | 0.06103769992478193 | 0.0760116800665856 | {'lhs': (10000, 10), 'rhs': (10000, 10)} |
  123. | broadcast_lesser_equal | 0.046627658884972334 | 0.04603699198924005 | 0.04669731133617461 | 0.061619681655429324 | {'lhs': (10000, 1), 'rhs': (10000, 1)} |
  124. | broadcast_logical_and | 0.06829977093730122 | 0.06727798609063029 | 0.07048980914987624 | 0.08565696247387683 | {'lhs': (1024, 1024), 'rhs': (1024, 1024)} |
  125. | broadcast_logical_and | 0.056663972209207714 | 0.0561330234631896 | 0.05906159058213234 | 0.07171419449150568 | {'lhs': (10000, 10), 'rhs': (10000, 10)} |
  126. | broadcast_logical_and | 0.053106172126717865 | 0.05271850386634469 | 0.05336711765266955 | 0.06548180652316661 | {'lhs': (10000, 1), 'rhs': (10000, 1)} |
  127. | broadcast_logical_or | 0.06729018117766827 | 0.06651500007137656 | 0.06923437467776239 | 0.08395779703278096 | {'lhs': (1024, 1024), 'rhs': (1024, 1024)} |
  128. | broadcast_logical_or | 0.05655490036588162 | 0.055836018873378634 | 0.0588238995987922 | 0.07073695829603828 | {'lhs': (10000, 10), 'rhs': (10000, 10)} |
  129. | broadcast_logical_or | 0.05397163098677993 | 0.053614494390785694 | 0.054216483840718865 | 0.06465684564318509 | {'lhs': (10000, 1), 'rhs': (10000, 1)} |
  130. | broadcast_logical_xor | 0.1739562297007069 | 0.17285349895246327 | 0.17693880363367498 | 0.18855369999073449 | {'lhs': (1024, 1024), 'rhs': (1024, 1024)} |
  131. | broadcast_logical_xor | 0.06314520258456469 | 0.06263947580009699 | 0.06494201370514929 | 0.07473545265384021 | {'lhs': (10000, 10), 'rhs': (10000, 10)} |
  132. | broadcast_logical_xor | 0.06162970094010234 | 0.06116749136708677 | 0.06182031938806176 | 0.07095346401911233 | {'lhs': (10000, 1), 'rhs': (10000, 1)} |
  133. | broadcast_maximum | 0.2670747140655294 | 0.2468364837113768 | 0.2559980843216181 | 0.8910152595490248 | {'lhs': (1024, 1024), 'rhs': (1024, 1024)} |
  134. | broadcast_maximum | 0.1844577194424346 | 0.18259949865750968 | 0.19054727745242417 | 0.2260852407198401 | {'lhs': (10000, 10), 'rhs': (10000, 10)} |
  135. | broadcast_maximum | 0.1627115812152624 | 0.16136953490786254 | 0.1676132087595761 | 0.18139621941372774 | {'lhs': (10000, 1), 'rhs': (10000, 1)} |
  136. | broadcast_minimum | 0.26594831026159227 | 0.24565501371398568 | 0.25699299294501543 | 0.9122870594728766 | {'lhs': (1024, 1024), 'rhs': (1024, 1024)} |
  137. | broadcast_minimum | 0.18404138972982764 | 0.18228849512524903 | 0.1885324832983315 | 0.22256336058489998 | {'lhs': (10000, 10), 'rhs': (10000, 10)} |
  138. | broadcast_minimum | 0.16362516209483147 | 0.1615759974811226 | 0.16868181992322206 | 0.18729942617937945 | {'lhs': (10000, 1), 'rhs': (10000, 1)} |
  139. | broadcast_minus | 0.07626174192409962 | 0.07482152432203293 | 0.07900789496488869 | 0.10384424182120713 | {'lhs': (1024, 1024), 'rhs': (1024, 1024)} |
  140. | broadcast_minus | 0.11766721494495869 | 0.11909502791240811 | 0.12168526882305745 | 0.1672468351898716 | {'lhs': (10000, 10), 'rhs': (10000, 10)} |
  141. | broadcast_minus | 0.03962149261496961 | 0.038555997889488935 | 0.0432480184827 | 0.05259863566607243 | {'lhs': (10000, 1), 'rhs': (10000, 1)} |
  142. | broadcast_mod | 1.7202818393707275 | 1.6371594683732837 | 1.7839077627286315 | 3.3539004216436297 | {'lhs': (1024, 1024), 'rhs': (1024, 1024)} |
  143. | broadcast_mod | 0.4308364784810692 | 0.42869048775173724 | 0.43984647491015494 | 0.4607384302653373 | {'lhs': (10000, 10), 'rhs': (10000, 10)} |
  144. | broadcast_mod | 0.18445874913595617 | 0.1739785075187683 | 0.21140497410669923 | 0.24245642824098482 | {'lhs': (10000, 1), 'rhs': (10000, 1)} |
  145. | broadcast_mul | 0.2925583306932822 | 0.26998997782357037 | 0.2936248842161149 | 0.8094485983019727 | {'lhs': (1024, 1024), 'rhs': (1024, 1024)} |
  146. | broadcast_mul | 0.2701892954064533 | 0.2670385001692921 | 0.2784956246614456 | 0.3015698195667941 | {'lhs': (10000, 10), 'rhs': (10000, 10)} |
  147. | broadcast_mul | 0.15342347731348127 | 0.15144702047109604 | 0.157531799050048 | 0.173257308197208 | {'lhs': (10000, 1), 'rhs': (10000, 1)} |
  148. | broadcast_not_equal | 0.06679503771010786 | 0.06568251410499215 | 0.06812058854848146 | 0.08543448289856327 | {'lhs': (1024, 1024), 'rhs': (1024, 1024)} |
  149. | broadcast_not_equal | 0.0568884116364643 | 0.055384967708960176 | 0.06539840251207352 | 0.07125782081857329 | {'lhs': (10000, 10), 'rhs': (10000, 10)} |
  150. | broadcast_not_equal | 0.05118060333188623 | 0.050452013965696096 | 0.051922135753557086 | 0.06370240065734836 | {'lhs': (10000, 1), 'rhs': (10000, 1)} |
  151. | broadcast_plus | 0.06627624796237797 | 0.06496848072856665 | 0.06761479889973998 | 0.0989680172642694 | {'lhs': (1024, 1024), 'rhs': (1024, 1024)} |
  152. | broadcast_plus | 0.09882695914711803 | 0.09758200030773878 | 0.09831367642618716 | 0.12740517093334353 | {'lhs': (10000, 10), 'rhs': (10000, 10)} |
  153. | broadcast_plus | 0.04238171852193773 | 0.04441398777998984 | 0.04553121980279684 | 0.05129080265760427 | {'lhs': (10000, 1), 'rhs': (10000, 1)} |
  154. | broadcast_power | 6.466223181341775 | 6.461356504587457 | 6.488376023480669 | 6.59264532267116 | {'lhs': (1024, 1024), 'rhs': (1024, 1024)} |
  155. | broadcast_power | 0.7727029005764052 | 0.717356480890885 | 0.7275094103533775 | 0.7868484710343456 | {'lhs': (10000, 10), 'rhs': (10000, 10)} |
  156. | broadcast_power | 0.21605570509564131 | 0.20965500152669847 | 0.21944900508970022 | 0.246844448265622 | {'lhs': (10000, 1), 'rhs': (10000, 1)} |
  157. | broadcast_sub | 0.24336743808817118 | 0.22088049445301294 | 0.23409047862514853 | 0.8967068057972974 | {'lhs': (1024, 1024), 'rhs': (1024, 1024)} |
  158. | broadcast_sub | 0.2438928058836609 | 0.24160899920389056 | 0.251661118818447 | 0.28768861084245173 | {'lhs': (10000, 10), 'rhs': (10000, 10)} |
  159. | broadcast_sub | 0.1505346322664991 | 0.1488559937570244 | 0.15415151719935238 | 0.1709596754517409 | {'lhs': (10000, 1), 'rhs': (10000, 1)} |
  160. | cbrt | 1.4946453046286479 | 1.0537869820836931 | 1.0851217375602573 | 18.655183704686387 | {'data': (1024, 1024)} |
  161. | cbrt | 0.12854980013798922 | 0.12485799379646778 | 0.13221591943874958 | 0.17027305962983613 | {'data': (10000, 1)} |
  162. | cbrt | 1.0894027352333069 | 1.021071511786431 | 1.0489502165000886 | 1.7370466119610035 | {'data': (10000, 100)} |
  163. | ceil | 0.10102776810526848 | 0.09962852345779538 | 0.10116079938597977 | 0.129540221532807 | {'data': (1024, 1024)} |
  164. | ceil | 0.05276404146570712 | 0.05225301720201969 | 0.052821915596723557 | 0.0654795684386045 | {'data': (10000, 1)} |
  165. | ceil | 0.09839981852564961 | 0.09743249393068254 | 0.09977330919355154 | 0.12447975226677957 | {'data': (10000, 100)} |
  166. | cos | 0.804903099196963 | 0.788036035373807 | 0.7998066605068743 | 1.4323595096357173 | {'data': (1024, 1024)} |
  167. | cos | 0.21482747048139572 | 0.21356053184717894 | 0.21967239445075393 | 0.23354497388936588 | {'data': (10000, 1)} |
  168. | cos | 0.7716745010111481 | 0.753509026253596 | 0.7665235607419163 | 1.4094880188349648 | {'data': (10000, 100)} |
  169. | cosh | 1.8983367725741118 | 1.8852815264835954 | 1.8952846876345575 | 2.4901406757999216 | {'data': (1024, 1024)} |
  170. | cosh | 0.13161042239516973 | 0.12994749704375863 | 0.1347702112980187 | 0.1554036966990681 | {'data': (10000, 1)} |
  171. | cosh | 1.815156587981619 | 1.8002224969677627 | 1.811521191848442 | 2.458659917465412 | {'data': (10000, 100)} |
  172. | degrees | 0.1502796378917992 | 0.1298824790865183 | 0.1338290865533054 | 0.7807160512311418 | {'data': (1024, 1024)} |
  173. | degrees | 0.11945643636863679 | 0.1178164966404438 | 0.1214133168105036 | 0.15308132453355947 | {'data': (10000, 1)} |
  174. | degrees | 0.14633870217949152 | 0.12517248978838325 | 0.12835157103836536 | 0.8171775640221349 | {'data': (10000, 100)} |
  175. | depth_to_space | 0.0726869102800265 | 0.07185348658822477 | 0.07425349904224277 | 0.08854205952957295 | {'data': (1, 4, 2, 4), 'block_size': 2} |
  176. | depth_to_space | 0.2524156140862033 | 0.2509769983589649 | 0.2576935919933021 | 0.2715162129607052 | {'data': (10, 25, 10, 100), 'block_size': 5} |
  177. | dot | 9.879384484956972 | 9.32183550321497 | 9.522688324796036 | 12.122057244996839 | {'lhs': (1024, 1024), 'rhs': (1024, 1024)} |
  178. | dot | 3.8089211186161265 | 3.7930920370854437 | 3.8218701956793666 | 4.491224493831397 | {'lhs': (1000, 10), 'rhs': (1000, 10), 'transpose_b': True} |
  179. | dot | 0.32580989762209356 | 0.3212355077266693 | 0.33361519454047084 | 0.4042876412859193 | {'lhs': (1000, 1), 'rhs': (100, 1000), 'transpose_a': True, 'transpose_b': True} |
  180. | elemwise_add | 0.06878519430756569 | 0.06772999768145382 | 0.07008221582509577 | 0.09913676185533409 | {'lhs': (1024, 1024), 'rhs': (1024, 1024)} |
  181. | elemwise_add | 0.10224876808933914 | 0.10082600056193769 | 0.1018941926304251 | 0.14147251669783165 | {'lhs': (10000, 10), 'rhs': (10000, 10)} |
  182. | elemwise_add | 0.04413039539940655 | 0.04143800470046699 | 0.0482055707834661 | 0.05571061803493654 | {'lhs': (10000, 1), 'rhs': (10000, 1)} |
  183. | elemwise_div | 0.06705681094899774 | 0.0663139799144119 | 0.06879100110381842 | 0.08412035822402687 | {'lhs': (1024, 1024), 'rhs': (1024, 1024)} |
  184. | elemwise_div | 0.058099800371564925 | 0.057572993682697415 | 0.060095504159107804 | 0.07715175393968822 | {'lhs': (10000, 10), 'rhs': (10000, 10)} |
  185. | elemwise_div | 0.04912031639833003 | 0.048647983931005 | 0.04960458027198911 | 0.05665308097377423 | {'lhs': (10000, 1), 'rhs': (10000, 1)} |
  186. | elemwise_mul | 0.06856216234154999 | 0.0673640170134604 | 0.07140047382563353 | 0.0912931299535558 | {'lhs': (1024, 1024), 'rhs': (1024, 1024)} |
  187. | elemwise_mul | 0.10060931963380426 | 0.09927450446411967 | 0.10093468590639532 | 0.1415709219872953 | {'lhs': (10000, 10), 'rhs': (10000, 10)} |
  188. | elemwise_mul | 0.04405227315146476 | 0.045389519073069096 | 0.04718679119832814 | 0.052764586871489966 | {'lhs': (10000, 1), 'rhs': (10000, 1)} |
  189. | elemwise_sub | 0.06974529940634966 | 0.0685674895066768 | 0.07163088885135949 | 0.08920532593037943 | {'lhs': (1024, 1024), 'rhs': (1024, 1024)} |
  190. | elemwise_sub | 0.10203705984167755 | 0.10021001799032092 | 0.10193792986683547 | 0.14359444670844843 | {'lhs': (10000, 10), 'rhs': (10000, 10)} |
  191. | elemwise_sub | 0.043908170773647726 | 0.04335603443905711 | 0.04733320092782378 | 0.05242263956461108 | {'lhs': (10000, 1), 'rhs': (10000, 1)} |
  192. | erf | 1.4989157498348504 | 1.360700000077486 | 1.3731223181821406 | 4.030498290085271 | {'data': (1024, 1024)} |
  193. | erf | 0.23320369073189795 | 0.23156247334554791 | 0.2393866772763431 | 0.2517211821395905 | {'data': (10000, 1)} |
  194. | erf | 1.3062428298871964 | 1.2903014721814543 | 1.3091098167933524 | 2.0276389777427544 | {'data': (10000, 100)} |
  195. | erfinv | 5.519544942071661 | 5.503028980456293 | 5.536944483174011 | 6.181511946488172 | {'data': (1024, 1024)} |
  196. | erfinv | 0.14420972962398082 | 0.14249852392822504 | 0.14795318129472437 | 0.17099211399909137 | {'data': (10000, 1)} |
  197. | erfinv | 5.234347780351527 | 5.201331019634381 | 5.2292247011791915 | 5.939365220256153 | {'data': (10000, 100)} |
  198. | exp | 0.46826651378069073 | 0.4664734879042953 | 0.47664131270721555 | 0.48756105650682 | {'data': (1024, 1024)} |
  199. | exp | 0.047931778244674206 | 0.04770199302583933 | 0.04975340561941266 | 0.062354890978895135 | {'data': (10000, 1)} |
  200. | exp | 0.44992151902988553 | 0.44879800407215953 | 0.45759761123917997 | 0.4651269997702912 | {'data': (10000, 100)} |
  201. | expm1 | 1.3053829915588722 | 1.2928230280522257 | 1.3057496631518006 | 1.9391858275048437 | {'data': (1024, 1024)} |
  202. | expm1 | 0.14792724861763418 | 0.14487249427475035 | 0.15274108736775815 | 0.21859470230992895 | {'data': (10000, 1)} |
  203. | expm1 | 1.2471957091474906 | 1.2298005167394876 | 1.2428864953108132 | 1.918388529447839 | {'data': (10000, 100)} |
  204. | fix | 0.22834838018752635 | 0.22681447444483638 | 0.23423833190463483 | 0.24033016874454924 | {'data': (1024, 1024)} |
  205. | fix | 0.07415675208903849 | 0.07343699689954519 | 0.07410210091620684 | 0.08780257834587256 | {'data': (10000, 1)} |
  206. | fix | 0.22058654809370637 | 0.21921450388617814 | 0.22589970612898472 | 0.23713353672064844 | {'data': (10000, 100)} |
  207. | flatten | 1.275658038794063 | 1.2751714675687253 | 1.2986565940082073 | 1.3024954503634945 | {'data': (1024, 1024)} |
  208. | flatten | 0.03150251635815948 | 0.029850489227101207 | 0.03285968559794128 | 0.05388255114667134 | {'data': (10000, 1)} |
  209. | flatten | 1.2649763067020103 | 1.26629151054658 | 1.2791522196494043 | 1.2968258070759475 | {'data': (10000, 100)} |
  210. | flip | 0.2321764366934076 | 0.23048548609949648 | 0.2364260784815997 | 0.26218589104246354 | {'data': (1024, 1024), 'axis': 0} |
  211. | flip | 0.0623907771660015 | 0.06175946327857673 | 0.06464548059739172 | 0.07738658809103079 | {'data': (10000, 1), 'axis': 0} |
  212. | flip | 0.22293045127298683 | 0.22181752137839794 | 0.2253075072076172 | 0.24018510826863354 | {'data': (10000, 100), 'axis': 0} |
  213. | floor | 0.10794324974995106 | 0.10711050708778203 | 0.10967010166496038 | 0.1199620618717746 | {'data': (1024, 1024)} |
  214. | floor | 0.053944067913107574 | 0.05321649950928986 | 0.0537852116394788 | 0.0682597002014519 | {'data': (10000, 1)} |
  215. | floor | 0.1059126277687028 | 0.10425198706798255 | 0.10726343025453389 | 0.1380038977367807 | {'data': (10000, 100)} |
  216. | ftml_update | 1.0696853691479191 | 1.0667530004866421 | 1.079452713020146 | 1.0858212312450632 | {'weight': (1024, 1024), 'grad': (1024, 1024), 'd': (1024, 1024), 'v': (1024, 1024), 'z': (1024, 1024), 'lr': 0.1, 'beta1': 0.1, 'beta2': 0.1, 'epsilon': 1e-08, 't': 1, 'rescale_grad': 0.4, 'clip_grad': -1.0} |
  217. | ftml_update | 0.0946981186280027 | 0.09028197382576764 | 0.09464503382332623 | 0.13240553380455952 | {'weight': (10000, 1), 'grad': (10000, 1), 'd': (10000, 1), 'v': (10000, 1), 'z': (10000, 1), 'lr': 0.5, 'beta1': 0.5, 'beta2': 0.5, 'epsilon': 1e-08, 't': 1, 'rescale_grad': 0.4, 'clip_grad': -1.0} |
  218. | ftml_update | 1.1280413117492571 | 1.0758799908217043 | 1.3303226209245622 | 1.3978971377946436 | {'weight': (10000, 100), 'grad': (10000, 100), 'd': (10000, 100), 'v': (10000, 100), 'z': (10000, 100), 'lr': 0.9, 'beta1': 0.9, 'beta2': 0.9, 'epsilon': 1e-08, 't': 1, 'rescale_grad': 0.4, 'clip_grad': -1.0} |
  219. | ftrl_update | 0.8874610305065289 | 0.8763534715399146 | 0.9397255955263973 | 0.9847382333828137 | {'weight': (1024, 1024), 'grad': (1024, 1024), 'z': (1024, 1024), 'n': (1024, 1024), 'lr': 0.1, 'rescale_grad': 0.4} |
  220. | ftrl_update | 0.07559165358543396 | 0.07406200165860355 | 0.07709478959441186 | 0.11342019424773775 | {'weight': (10000, 1), 'grad': (10000, 1), 'z': (10000, 1), 'n': (10000, 1), 'lr': 0.5, 'rescale_grad': 0.4} |
  221. | ftrl_update | 0.9154607547679916 | 0.8737150055821985 | 1.0517397371586414 | 1.3304632430663335 | {'weight': (10000, 100), 'grad': (10000, 100), 'z': (10000, 100), 'n': (10000, 100), 'lr': 0.9, 'rescale_grad': 0.4} |
  222. | gamma | 8.07941191829741 | 8.065232512308285 | 8.074487652629614 | 8.680866308277473 | {'data': (1024, 1024)} |
  223. | gamma | 0.1986669300822541 | 0.1933590101543814 | 0.19827630603685975 | 0.23059808881953558 | {'data': (10000, 1)} |
  224. | gamma | 6.9233430188614875 | 7.680763985263184 | 7.69865334732458 | 8.368486235267488 | {'data': (10000, 100)} |
  225. | gammaln | 21.85047817940358 | 21.722670004237443 | 22.05058957915753 | 23.373431288055144 | {'data': (1024, 1024)} |
  226. | gammaln | 0.3046635282225907 | 0.29874948086217046 | 0.3055752895306796 | 0.3221910615684489 | {'data': (10000, 1)} |
  227. | gammaln | 20.75877398950979 | 20.691349491244182 | 20.730123401153833 | 21.449550547986316 | {'data': (10000, 100)} |
  228. | hard_sigmoid | 0.27135398879181594 | 0.26897049974650145 | 0.2823843795340508 | 0.2908784034661949 | {'data': (1024, 1024), 'alpha': 0.25, 'beta': 0.5} |
  229. | hard_sigmoid | 0.16004401200916618 | 0.15836648526601493 | 0.16527281259186566 | 0.19466504978481694 | {'data': (10000, 1), 'alpha': 0.25, 'beta': 0.5} |
  230. | hard_sigmoid | 0.2643894567154348 | 0.2631029929034412 | 0.27166329091414815 | 0.30082823068369186 | {'data': (10000, 100), 'alpha': 0.25, 'beta': 0.5} |
  231. | identity | 1.2446485995315015 | 1.2457680131774396 | 1.2619168031960726 | 1.266698133549653 | {'data': (1024, 1024)} |
  232. | identity | 0.03837997035589069 | 0.03747647861018777 | 0.03842011792585254 | 0.05617823277134462 | {'data': (10000, 1)} |
  233. | identity | 1.2568573578028008 | 1.256686489796266 | 1.2724430882371962 | 1.2818714953027666 | {'data': (10000, 100)} |
  234. | log | 0.5225845793029293 | 0.5081069830339402 | 0.5179952073376626 | 1.134516522288323 | {'data': (1024, 1024)} |
  235. | log | 0.14740398968569934 | 0.14594601816497743 | 0.15207339311018586 | 0.16763778345193728 | {'data': (10000, 1)} |
  236. | log | 0.5045631382381544 | 0.48823151155374944 | 0.49984988290816545 | 1.171624617418275 | {'data': (10000, 100)} |
  237. | log10 | 0.8690233493689448 | 0.7759665022604167 | 0.7878979842644186 | 2.256068953429392 | {'data': (1024, 1024)} |
  238. | log10 | 0.14646837080363184 | 0.14362498768605292 | 0.14983458095230165 | 0.1754160632845021 | {'data': (10000, 1)} |
  239. | log10 | 0.814528011251241 | 0.7434360159095377 | 0.8538965717889369 | 1.4251910074381253 | {'data': (10000, 100)} |
  240. | log1p | 0.8971280133118853 | 0.9103955235332251 | 0.9390499151777476 | 1.614437153330078 | {'data': (1024, 1024)} |
  241. | log1p | 0.17378835880663246 | 0.17094999202527106 | 0.18312595784664154 | 0.19954157643951498 | {'data': (10000, 1)} |
  242. | log1p | 0.9093655733158812 | 0.9012784867081791 | 0.9260724997147918 | 1.614686710527167 | {'data': (10000, 100)} |
  243. | log2 | 0.6567541393451393 | 0.6416245014406741 | 0.6526465760543942 | 1.2617219256935648 | {'data': (1024, 1024)} |
  244. | log2 | 0.1468039833707735 | 0.1452020078431815 | 0.15152408159337938 | 0.1655671774642544 | {'data': (10000, 1)} |
  245. | log2 | 0.6561819894704968 | 0.612737494520843 | 0.7280792982783169 | 1.291884622769431 | {'data': (10000, 100)} |
  246. | log_softmax | 1.9050724926637486 | 1.9052224815823138 | 1.9126463681459427 | 1.91823260684032 | {'data': (1024, 1024), 'axis': -1, 'temperature': 0.5} |
  247. | log_softmax | 0.18009843886829913 | 0.1778354635462165 | 0.1877829374279827 | 0.20008120918646471 | {'data': (10000, 1), 'axis': -1, 'temperature': 0.5} |
  248. | log_softmax | 1.8047690502135083 | 1.8052074883598834 | 1.811245211865753 | 1.8295876565389337 | {'data': (10000, 100), 'axis': -1, 'temperature': 0.5} |
  249. | logical_not | 0.06023157562594861 | 0.05900298128835857 | 0.06297072977758944 | 0.0854212709236891 | {'data': (1024, 1024)} |
  250. | logical_not | 0.04605321679264307 | 0.045040505938231945 | 0.045925471931695945 | 0.06006411858834338 | {'data': (10000, 1)} |
  251. | logical_not | 0.06104564934503287 | 0.05952600622549653 | 0.06285890121944249 | 0.0958294107113035 | {'data': (10000, 100)} |
  252. | make_loss | 1.2135857582325116 | 1.2146819790359586 | 1.231602526968345 | 1.2395317031769082 | {'data': (1024, 1024)} |
  253. | make_loss | 0.04000872315373272 | 0.03942247712984681 | 0.04000160261057317 | 0.055909079965204056 | {'data': (10000, 1)} |
  254. | make_loss | 1.2016182456864044 | 1.2019970163237303 | 1.2135006312746555 | 1.2254288682015615 | {'data': (10000, 100)} |
  255. | max | 0.7700030482374132 | 0.7670480117667466 | 0.7803990738466382 | 0.8004772564163433 | {'data': (1024, 1024), 'axis': 0} |
  256. | max | 0.21371782757341862 | 0.21252100123092532 | 0.21876239334233105 | 0.22807258006650963 | {'data': (10000, 1), 'axis': 0} |
  257. | max | 1.7800016672117636 | 1.2396355159580708 | 1.8055129563435912 | 4.333400481264357 | {'data': (10000, 100), 'axis': 0} |
  258. | max_axis | 0.6816166418138891 | 0.679730495903641 | 0.6895889178849757 | 0.709880235954188 | {'data': (1024, 1024), 'axis': 0} |
  259. | max_axis | 0.11862389394082129 | 0.11782400542870164 | 0.1199557154905051 | 0.13743173563852926 | {'data': (10000, 1), 'axis': 0} |
  260. | max_axis | 0.5587640416342765 | 0.550464988918975 | 0.57424585102126 | 0.5901562684448448 | {'data': (10000, 100), 'axis': 0} |
  261. | mean | 1.936670567956753 | 1.9261764828115702 | 1.9414848065935075 | 2.0847332390258093 | {'data': (1024, 1024), 'axis': 0} |
  262. | mean | 0.2428105112630874 | 0.2422815014142543 | 0.24974953848868608 | 0.26026101317256695 | {'data': (10000, 1), 'axis': 0} |
  263. | mean | 1.780869213398546 | 1.7585134773980826 | 1.8750887538772076 | 1.9528717274079102 | {'data': (10000, 100), 'axis': 0} |
  264. | min | 1.2643861240940168 | 1.2469355133362114 | 1.3698606344405562 | 1.3920145109295847 | {'data': (1024, 1024), 'axis': 0} |
  265. | min | 0.23868698859587312 | 0.20548250176943839 | 0.28808509814552963 | 0.35870582098141324 | {'data': (10000, 1), 'axis': 0} |
  266. | min | 1.349409141112119 | 1.154684490757063 | 1.7732545325998217 | 1.9299304031301392 | {'data': (10000, 100), 'axis': 0} |
  267. | min_axis | 0.6888521509245038 | 0.6858265260234475 | 0.6981764745432884 | 0.7149874547030778 | {'data': (1024, 1024), 'axis': 0} |
  268. | min_axis | 0.1483784627635032 | 0.14769850531592965 | 0.15038332203403115 | 0.1613077812362463 | {'data': (10000, 1), 'axis': 0} |
  269. | min_axis | 0.5714807065669447 | 0.5695194704458117 | 0.5818260658998042 | 0.6028741778573031 | {'data': (10000, 100), 'axis': 0} |
  270. | mp_sgd_mom_update | 0.1976874005049467 | 0.19624052220024168 | 0.2028913295362145 | 0.21613885823171586 | {'weight': (1024, 1024), 'grad': (1024, 1024), 'mom': (1024, 1024), 'weight32': (1024, 1024), 'lr': 0.1, 'rescale_grad': 0.4, 'lazy_update': 0} |
  271. | mp_sgd_mom_update | 0.07257528137415648 | 0.07189851021394134 | 0.07539350772276521 | 0.08759390912018725 | {'weight': (10000, 1), 'grad': (10000, 1), 'mom': (10000, 1), 'weight32': (10000, 1), 'lr': 0.5, 'rescale_grad': 0.4, 'lazy_update': 0} |
  272. | mp_sgd_mom_update | 0.19135746115352958 | 0.19018552848137915 | 0.19436219008639455 | 0.2079788740957156 | {'weight': (10000, 100), 'grad': (10000, 100), 'mom': (10000, 100), 'weight32': (10000, 100), 'lr': 0.9, 'rescale_grad': 0.4, 'lazy_update': 0} |
  273. | mp_sgd_update | 0.15778089698869735 | 0.1563024998176843 | 0.16050877165980637 | 0.17561951244715604 | {'weight': (1024, 1024), 'grad': (1024, 1024), 'weight32': (1024, 1024), 'lr': 0.1, 'rescale_grad': 0.4, 'lazy_update': 0} |
  274. | mp_sgd_update | 0.07022538396995515 | 0.06965748616494238 | 0.0729149382095784 | 0.08290749276056891 | {'weight': (10000, 1), 'grad': (10000, 1), 'weight32': (10000, 1), 'lr': 0.5, 'rescale_grad': 0.4, 'lazy_update': 0} |
  275. | mp_sgd_update | 0.1532155816676095 | 0.15194001025520265 | 0.15563609777018428 | 0.17364571627695116 | {'weight': (10000, 100), 'grad': (10000, 100), 'weight32': (10000, 100), 'lr': 0.9, 'rescale_grad': 0.4, 'lazy_update': 0} |
  276. | nanprod | 1.3743750390131027 | 1.333311985945329 | 1.4514431648422033 | 1.4844371483195573 | {'data': (1024, 1024), 'axis': 0} |
  277. | nanprod | 0.20412367419339716 | 0.20327247329987586 | 0.20980145782232287 | 0.21693864779081204 | {'data': (10000, 1), 'axis': 0} |
  278. | nanprod | 1.4446606126148254 | 1.2732655159197748 | 1.9435975118540227 | 2.0862253999803215 | {'data': (10000, 100), 'axis': 0} |
  279. | nansum | 1.28231015172787 | 1.2793370115105063 | 1.2940461339894682 | 1.3042744738049805 | {'data': (1024, 1024), 'axis': 0} |
  280. | nansum | 0.2148767892504111 | 0.21418152027763426 | 0.22058351896703243 | 0.22769369010347879 | {'data': (10000, 1), 'axis': 0} |
  281. | nansum | 1.1612215742934495 | 1.1421320086810738 | 1.242294005351141 | 1.2668383843265476 | {'data': (10000, 100), 'axis': 0} |
  282. | negative | 0.06775593152269721 | 0.06738601950928569 | 0.07041482604108751 | 0.08617439772933722 | {'data': (1024, 1024)} |
  283. | negative | 0.05091671191621572 | 0.050489004934206605 | 0.05093610961921513 | 0.06409965630155061 | {'data': (10000, 1)} |
  284. | negative | 0.06653283257037401 | 0.06566502270288765 | 0.06882718880660832 | 0.0871763384202496 | {'data': (10000, 100)} |
  285. | ones_like | 0.06557988584972918 | 0.065032480051741 | 0.06775257643312216 | 0.08089038834441455 | {'data': (1024, 1024)} |
  286. | ones_like | 0.05092323524877429 | 0.050625967560335994 | 0.05118437693454325 | 0.05983732524327935 | {'data': (10000, 1)} |
  287. | ones_like | 0.06550552847329527 | 0.06454598042182624 | 0.06773619679734111 | 0.08467662264592955 | {'data': (10000, 100)} |
  288. | prod | 1.8085357907693833 | 1.2674809840973467 | 1.2880909140221777 | 5.653123274678597 | {'data': (1024, 1024), 'axis': 0} |
  289. | prod | 0.2053508337121457 | 0.20317098824307323 | 0.21196962334215644 | 0.22864818340167428 | {'data': (10000, 1), 'axis': 0} |
  290. | prod | 1.8374364782357588 | 1.1476950021460652 | 1.9285164831671864 | 2.5991235475523977 | {'data': (10000, 100), 'axis': 0} |
  291. | radians | 0.2218272292520851 | 0.2020465035457164 | 0.20901624229736626 | 0.8218429156113448 | {'data': (1024, 1024)} |
  292. | radians | 0.15390957705676556 | 0.1520054938737303 | 0.15739889931865036 | 0.18013169057667291 | {'data': (10000, 1)} |
  293. | radians | 0.1934293343219906 | 0.17117499373853207 | 0.17836441984400153 | 0.8614059491083063 | {'data': (10000, 100)} |
  294. | random_exponential | 1.6689918411429971 | 1.661767513724044 | 1.6965274175163358 | 1.7435537511482837 | {'shape': (1024, 1024)} |
  295. | random_exponential | 0.07287354557774961 | 0.07191248005256057 | 0.07466660463251173 | 0.08775576076004664 | {'shape': (10000, 1)} |
  296. | random_exponential | 1.6000147484010085 | 1.5937014832161367 | 1.6254660615231842 | 1.6579969582380727 | {'shape': (10000, 100)} |
  297. | random_gamma | 5.160008341190405 | 5.152459518285468 | 5.230046872748062 | 5.267579759238288 | {'shape': (1024, 1024)} |
  298. | random_gamma | 0.11324453691486269 | 0.11174901737831533 | 0.115206278860569 | 0.13890265545342123 | {'shape': (10000, 1)} |
  299. | random_gamma | 4.9053277797065675 | 4.885275528067723 | 4.975577513687313 | 5.027431431226432 | {'shape': (10000, 100)} |
  300. | random_generalized_negative_binomial | 7.10422990960069 | 6.975835975026712 | 7.070625957567245 | 9.8925521830097 | {'shape': (1024, 1024)} |
  301. | random_generalized_negative_binomial | 0.13358782627619803 | 0.13256951933726668 | 0.13544501271098852 | 0.15605266438797125 | {'shape': (10000, 1)} |
  302. | random_generalized_negative_binomial | 4.9780211399775 | 4.639184015104547 | 6.655612308532 | 6.754448653082363 | {'shape': (10000, 100)} |
  303. | random_negative_binomial | 4.627276086248457 | 4.107939486857504 | 5.90737996972166 | 6.062108909827659 | {'k': 1, 'p': 1, 'shape': (1024, 1024)} |
  304. | random_negative_binomial | 0.1145187730435282 | 0.10561200906522572 | 0.12959482264705002 | 0.14771858870517474 | {'k': 1, 'p': 1, 'shape': (10000, 1)} |
  305. | random_negative_binomial | 3.92029287701007 | 3.919228503946215 | 3.928655432537198 | 3.949978604214266 | {'k': 1, 'p': 1, 'shape': (10000, 100)} |
  306. | random_normal | 1.2883959716418758 | 1.2851950014010072 | 1.2968061259016395 | 1.324167717830278 | {'shape': (1024, 1024)} |
  307. | random_normal | 0.06683776795398444 | 0.06565049989148974 | 0.06814494845457375 | 0.08704369014594716 | {'shape': (10000, 1)} |
  308. | random_normal | 1.2312225927598774 | 1.2290724844206125 | 1.2388053757604212 | 1.2481998006114736 | {'shape': (10000, 100)} |
  309. | random_pdf_dirichlet | 0.0498343090293929 | 0.04911652649752796 | 0.05083670839667321 | 0.060715774889104186 | {'sample': (2,), 'alpha': [0.0, 2.5]} |
  310. | random_pdf_exponential | 0.04986926156561822 | 0.04900502972304821 | 0.051665672799572356 | 0.06311338860541592 | {'sample': (2,), 'lam': [1.0, 8.5]} |
  311. | random_pdf_gamma | 0.1315904187504202 | 0.05108703044243157 | 0.05359878414310515 | 3.7392735917819695 | {'sample': (2,), 'alpha': [0.0, 2.5], 'beta': [1.0, 0.7]} |
  312. | random_pdf_generalized_negative_binomial | 0.050876527675427496 | 0.050291011575609446 | 0.05256770527921617 | 0.06218726397492002 | {'sample': (2,), 'mu': [2.0, 2.5], 'alpha': [0.0, 2.5]} |
  313. | random_pdf_negative_binomial | 0.051251741824671626 | 0.050619011744856834 | 0.05294840084388852 | 0.06229427061043692 | {'sample': (2,), 'k': [20, 49], 'p': [0.4, 0.77]} |
  314. | random_pdf_normal | 0.05165208945982158 | 0.05111948121339083 | 0.05305251688696444 | 0.061698253848590075 | {'sample': (2,), 'mu': [2.0, 2.5], 'sigma': [1.0, 3.7]} |
  315. | random_pdf_poisson | 0.049168537952937186 | 0.04853797145187855 | 0.050916807958856225 | 0.060049401363358 | {'sample': (2,), 'lam': [1.0, 8.5]} |
  316. | random_pdf_uniform | 0.0511011912021786 | 0.05040998803451657 | 0.052556092850863934 | 0.06414993724320094 | {'sample': (2,), 'low': [0.0, 2.5], 'high': [1.0, 3.7]} |
  317. | random_poisson | 1.6358446498634294 | 1.6494925366714597 | 1.6753080708440393 | 1.684981695143506 | {'shape': (1024, 1024)} |
  318. | random_poisson | 0.07311799912713468 | 0.07183951674960554 | 0.07511303410865366 | 0.09384217555634693 | {'shape': (10000, 1)} |
  319. | random_poisson | 1.5821520192548633 | 1.5805290022399276 | 1.5974916284903884 | 1.615850881789811 | {'shape': (10000, 100)} |
  320. | random_randint | 0.8883909933501855 | 0.8874920313246548 | 0.9030393266584724 | 0.9184293425641954 | {'low': 0, 'high': 5, 'shape': (1024, 1024)} |
  321. | random_randint | 0.07078660884872079 | 0.06952698458917439 | 0.07290859939530492 | 0.08832377789076436 | {'low': 0, 'high': 5, 'shape': (10000, 1)} |
  322. | random_randint | 0.8288717741379514 | 0.8220445306506008 | 0.8557264925912023 | 0.8870274003129452 | {'low': 0, 'high': 5, 'shape': (10000, 100)} |
  323. | random_uniform | 0.422120273578912 | 0.41789549868553877 | 0.43485640781000257 | 0.47931195644196134 | {'low': 0, 'high': 5, 'shape': (1024, 1024)} |
  324. | random_uniform | 0.0713254587026313 | 0.07030353299342096 | 0.07364279590547085 | 0.08794212830252962 | {'low': 0, 'high': 5, 'shape': (10000, 1)} |
  325. | random_uniform | 0.4109054576838389 | 0.4089379799552262 | 0.4191936401184648 | 0.44117068697232764 | {'low': 0, 'high': 5, 'shape': (10000, 100)} |
  326. | rcbrt | 2.0656499202596024 | 2.05329546588473 | 2.061983780004084 | 2.674573036492802 | {'data': (1024, 1024)} |
  327. | rcbrt | 0.14863287098705769 | 0.14662000467069447 | 0.1556144910864532 | 0.16820509277749823 | {'data': (10000, 1)} |
  328. | rcbrt | 1.9748128793435171 | 1.9616835052147508 | 1.9715616188477725 | 2.6244890072848652 | {'data': (10000, 100)} |
  329. | reciprocal | 0.20052903273608536 | 0.18026697216555476 | 0.19091302528977394 | 0.8314069535117626 | {'data': (1024, 1024)} |
  330. | reciprocal | 0.13829048548359424 | 0.1361760077998042 | 0.14318323228508234 | 0.17348610272165402 | {'data': (10000, 1)} |
  331. | reciprocal | 0.19677920441608876 | 0.17588899936527014 | 0.18485053442418575 | 0.867897825082767 | {'data': (10000, 100)} |
  332. | relu | 0.23958479869179428 | 0.22060799528844655 | 0.23153058136813343 | 0.8125600375933603 | {'data': (1024, 1024)} |
  333. | relu | 0.14363801921717823 | 0.1418330066371709 | 0.14779979246668518 | 0.16535636154003458 | {'data': (10000, 1)} |
  334. | relu | 0.23239118105266243 | 0.211919512366876 | 0.22073679137974977 | 0.8474795689107882 | {'data': (10000, 100)} |
  335. | rint | 0.18917557958047837 | 0.18825649749487638 | 0.19086640095338225 | 0.19983281963504854 | {'data': (1024, 1024)} |
  336. | rint | 0.07936700363643467 | 0.07879096665419638 | 0.07921598735265434 | 0.09344052465166898 | {'data': (10000, 1)} |
  337. | rint | 0.18276886024978012 | 0.18225453095510602 | 0.18494997057132423 | 0.19589839735999712 | {'data': (10000, 100)} |
  338. | rmsprop_update | 0.3255842375801876 | 0.32385598751716316 | 0.33409808529540896 | 0.33973579760640865 | {'weight': (1024, 1024), 'grad': (1024, 1024), 'n': (1024, 1024), 'lr': 0.1, 'gamma1': 0.1, 'epsilon': 1e-08, 'rescale_grad': 0.4} |
  339. | rmsprop_update | 0.07354485162068158 | 0.07262700819410384 | 0.07539482903666794 | 0.09214173653163032 | {'weight': (10000, 1), 'grad': (10000, 1), 'n': (10000, 1), 'lr': 0.5, 'gamma1': 0.5, 'epsilon': 1e-08, 'rescale_grad': 0.4} |
  340. | rmsprop_update | 0.4183006670791656 | 0.3546335210558027 | 0.6344049877952784 | 0.7359237282071263 | {'weight': (10000, 100), 'grad': (10000, 100), 'n': (10000, 100), 'lr': 0.9, 'gamma1': 0.9, 'epsilon': 1e-08, 'rescale_grad': 0.4} |
  341. | rmspropalex_update | 0.5148533411556855 | 0.5131405196152627 | 0.5241744336672127 | 0.5272967409109697 | {'weight': (1024, 1024), 'grad': (1024, 1024), 'n': (1024, 1024), 'g': (1024, 1024), 'delta': (1024, 1024), 'lr': 0.1, 'gamma1': 0.1, 'gamma2': 0.1, 'epsilon': 1e-08, 'rescale_grad': 0.4} |
  342. | rmspropalex_update | 0.08282772614620626 | 0.08187550702132285 | 0.08657683501951396 | 0.09562484570778919 | {'weight': (10000, 1), 'grad': (10000, 1), 'n': (10000, 1), 'g': (10000, 1), 'delta': (10000, 1), 'lr': 0.5, 'gamma1': 0.5, 'gamma2': 0.5, 'epsilon': 1e-08, 'rescale_grad': 0.4} |
  343. | rmspropalex_update | 0.8168537024175748 | 0.8099979895632714 | 0.8499103132635355 | 0.8709201135206969 | {'weight': (10000, 100), 'grad': (10000, 100), 'n': (10000, 100), 'g': (10000, 100), 'delta': (10000, 100), 'lr': 0.9, 'gamma1': 0.9, 'gamma2': 0.9, 'epsilon': 1e-08, 'rescale_grad': 0.4} |
  344. | round | 0.2572770119877532 | 0.25640599778853357 | 0.2620399056468159 | 0.2705810044426471 | {'data': (1024, 1024)} |
  345. | round | 0.09428749675862491 | 0.09348348248749971 | 0.0950915098655969 | 0.10787214792799207 | {'data': (10000, 1)} |
  346. | round | 0.24970000085886568 | 0.24887948529794812 | 0.25347271002829075 | 0.2601550874533132 | {'data': (10000, 100)} |
  347. | rsqrt | 1.0430975339841098 | 1.0294615058228374 | 1.0387022979557514 | 1.6443354438524698 | {'data': (1024, 1024)} |
  348. | rsqrt | 0.14565656892955303 | 0.1436159946024418 | 0.15589671675115824 | 0.17018059734255092 | {'data': (10000, 1)} |
  349. | rsqrt | 1.0013462201459333 | 0.9871490183286369 | 0.9949771279934794 | 1.653206375194714 | {'data': (10000, 100)} |
  350. | sample_exponential | 3.103664413210936 | 3.2404420198872685 | 3.270644770236686 | 3.2769259781343862 | {'lam': [1.0, 8.5], 'shape': (1024, 1024)} |
  351. | sample_exponential | 0.07804503897204995 | 0.07651851046830416 | 0.07959639187902212 | 0.10108391230460273 | {'lam': [1.0, 8.5], 'shape': (10000, 1)} |
  352. | sample_exponential | 2.3135353811085224 | 2.3127780004870147 | 2.3210379877127707 | 2.3585093137808144 | {'lam': [1.0, 8.5], 'shape': (10000, 100)} |
  353. | sample_gamma | 8.10772821016144 | 8.079962019110098 | 8.09890519012697 | 8.505651394953029 | {'alpha': [0.0, 2.5], 'shape': (1024, 1024), 'beta': [1.0, 0.7]} |
  354. | sample_gamma | 0.13890357629861683 | 0.13763498282060027 | 0.14107489841990173 | 0.15912925882730652 | {'alpha': [0.0, 2.5], 'shape': (10000, 1), 'beta': [1.0, 0.7]} |
  355. | sample_gamma | 7.714066429180093 | 7.712843507761136 | 7.725121633848175 | 7.7346836775541306 | {'alpha': [0.0, 2.5], 'shape': (10000, 100), 'beta': [1.0, 0.7]} |
  356. | sample_generalized_negative_binomial | 29.818685303325765 | 29.793374997098 | 29.993763979291543 | 30.130209782510068 | {'mu': [2.0, 2.5], 'shape': (1024, 1024), 'alpha': [0.0, 2.5]} |
  357. | sample_generalized_negative_binomial | 0.3510364185785875 | 0.34978502662852407 | 0.36217287415638566 | 0.39459118968807166 | {'mu': [2.0, 2.5], 'shape': (10000, 1), 'alpha': [0.0, 2.5]} |
  358. | sample_generalized_negative_binomial | 28.50679499679245 | 28.50984549149871 | 28.587236715247855 | 28.674334059469402 | {'mu': [2.0, 2.5], 'shape': (10000, 100), 'alpha': [0.0, 2.5]} |
  359. | sample_negative_binomial | 289.6374146826565 | 291.4460370084271 | 293.73846676317044 | 295.735945237102 | {'k': [20, 49], 'shape': (1024, 1024), 'p': [0.4, 0.77]} |
  360. | sample_negative_binomial | 2.8527684597065672 | 2.8524735243991017 | 2.8667104023043066 | 2.8848991345148534 | {'k': [20, 49], 'shape': (10000, 1), 'p': [0.4, 0.77]} |
  361. | sample_negative_binomial | 277.3412921797717 | 277.5989305227995 | 277.77493381872773 | 277.87741450127214 | {'k': [20, 49], 'shape': (10000, 100), 'p': [0.4, 0.77]} |
  362. | sample_normal | 3.759762817644514 | 3.7647089920938015 | 3.7762359774205834 | 3.7908726144814864 | {'mu': [2.0, 2.5], 'shape': (1024, 1024), 'sigma': [1.0, 3.7]} |
  363. | sample_normal | 0.1001852669287473 | 0.09924400364980102 | 0.10205479338765144 | 0.11395038338378086 | {'mu': [2.0, 2.5], 'shape': (10000, 1), 'sigma': [1.0, 3.7]} |
  364. | sample_normal | 3.594054530840367 | 3.594805981265381 | 3.603029460646212 | 3.6184913950273767 | {'mu': [2.0, 2.5], 'shape': (10000, 100), 'sigma': [1.0, 3.7]} |
  365. | sample_poisson | 5.039050009800121 | 4.730237473268062 | 6.693922885460779 | 6.700793453492224 | {'lam': [1.0, 8.5], 'shape': (1024, 1024)} |
  366. | sample_poisson | 0.10983291314914823 | 0.10881401249207556 | 0.11180301662534475 | 0.12654320045840006 | {'lam': [1.0, 8.5], 'shape': (10000, 1)} |
  367. | sample_poisson | 5.607051390688866 | 6.27343900850974 | 6.3541601004544646 | 6.392438903567381 | {'lam': [1.0, 8.5], 'shape': (10000, 100)} |
  368. | sample_uniform | 0.7781208824599162 | 0.7754084945190698 | 0.7871668960433453 | 0.8038860326632857 | {'low': [0.0, 2.5], 'shape': (1024, 1024), 'high': [1.0, 3.7]} |
  369. | sample_uniform | 0.07735782884992659 | 0.07648149039596319 | 0.08039931417442858 | 0.08920880791265524 | {'low': [0.0, 2.5], 'shape': (10000, 1), 'high': [1.0, 3.7]} |
  370. | sample_uniform | 0.7057806017110124 | 0.7519450155086815 | 0.7628178922459483 | 0.7821745192632079 | {'low': [0.0, 2.5], 'shape': (10000, 100), 'high': [1.0, 3.7]} |
  371. | sgd_mom_update | 0.18676045932807028 | 0.18514052499085665 | 0.19183901604264975 | 0.20677088818047196 | {'weight': (1024, 1024), 'grad': (1024, 1024), 'mom': (1024, 1024), 'lr': 0.1, 'rescale_grad': 0.4, 'lazy_update': 0} |
  372. | sgd_mom_update | 0.07138170243706554 | 0.07034049485810101 | 0.07424908108077943 | 0.08557719702366748 | {'weight': (10000, 1), 'grad': (10000, 1), 'mom': (10000, 1), 'lr': 0.5, 'rescale_grad': 0.4, 'lazy_update': 0} |
  373. | sgd_mom_update | 0.18118395819328725 | 0.17989648040384054 | 0.18395768711343408 | 0.1996332040289417 | {'weight': (10000, 100), 'grad': (10000, 100), 'mom': (10000, 100), 'lr': 0.9, 'rescale_grad': 0.4, 'lazy_update': 0} |
  374. | sgd_update | 0.15505328599829227 | 0.15382000128738582 | 0.1591979875229299 | 0.16661663539707663 | {'weight': (1024, 1024), 'grad': (1024, 1024), 'lr': 0.1, 'rescale_grad': 0.4, 'lazy_update': 0} |
  375. | sgd_update | 0.06916576181538403 | 0.06775750080123544 | 0.0709360814653337 | 0.11118717840872715 | {'weight': (10000, 1), 'grad': (10000, 1), 'lr': 0.5, 'rescale_grad': 0.4, 'lazy_update': 0} |
  376. | sgd_update | 0.15035710181109607 | 0.14919351087883115 | 0.15455711400136354 | 0.16375916951801628 | {'weight': (10000, 100), 'grad': (10000, 100), 'lr': 0.9, 'rescale_grad': 0.4, 'lazy_update': 0} |
  377. | shape_array | 0.03747223818209022 | 0.03803949221037328 | 0.03844329621642828 | 0.04761492542456836 | {'data': (1024, 1024)} |
  378. | shape_array | 0.03575138805899769 | 0.037277000956237316 | 0.038272986421361566 | 0.04450845532119274 | {'data': (10000, 1)} |
  379. | shape_array | 0.036844112328253686 | 0.03775599179789424 | 0.038299610605463386 | 0.04074043943546713 | {'data': (10000, 100)} |
  380. | shuffle | 1.6088540724013 | 1.6098505002446473 | 1.628114638151601 | 1.6523347230395302 | {'data': (1024, 1024)} |
  381. | shuffle | 0.31532989523839206 | 0.3141020133625716 | 0.32006812980398536 | 0.3257947380188853 | {'data': (10000, 1)} |
  382. | shuffle | 2.035430152900517 | 2.0340069895610213 | 2.050024800701067 | 2.0913318480597813 | {'data': (10000, 100)} |
  383. | sigmoid | 0.6232413684483618 | 0.6076100107748061 | 0.620775792049244 | 1.2628356483764953 | {'data': (1024, 1024)} |
  384. | sigmoid | 0.14693689707200974 | 0.1449644914828241 | 0.15152082196436822 | 0.1831087307073177 | {'data': (10000, 1)} |
  385. | sigmoid | 0.5960995203349739 | 0.5794070020783693 | 0.5912494845688343 | 1.2868897750740877 | {'data': (10000, 100)} |
  386. | sign | 0.3083832369884476 | 0.28953602304682136 | 0.30010009650141 | 0.9720192692475413 | {'data': (1024, 1024)} |
  387. | sign | 0.13602570164948702 | 0.13467049575410783 | 0.1409970864187926 | 0.16665813920553788 | {'data': (10000, 1)} |
  388. | sign | 0.29493152804207057 | 0.2758894697763026 | 0.28272412600927055 | 0.9793754626298345 | {'data': (10000, 100)} |
  389. | signsgd_update | 0.1884189818520099 | 0.18722651293501258 | 0.19188617006875575 | 0.2071467525092885 | {'weight': (1024, 1024), 'grad': (1024, 1024), 'lr': 0.1, 'rescale_grad': 0.4} |
  390. | signsgd_update | 0.0660248997155577 | 0.06518600275740027 | 0.06864342140033841 | 0.08118516940157866 | {'weight': (10000, 1), 'grad': (10000, 1), 'lr': 0.5, 'rescale_grad': 0.4} |
  391. | signsgd_update | 0.18157600541599095 | 0.18059497233480215 | 0.18422811990603805 | 0.1932645303895697 | {'weight': (10000, 100), 'grad': (10000, 100), 'lr': 0.9, 'rescale_grad': 0.4} |
  392. | signum_update | 0.2678319450933486 | 0.26636800612322986 | 0.27332708123140037 | 0.2827174082631245 | {'weight': (1024, 1024), 'grad': (1024, 1024), 'mom': (1024, 1024), 'lr': 0.1, 'rescale_grad': 0.4} |
  393. | signum_update | 0.06867849384434521 | 0.0679665245115757 | 0.0705031561665237 | 0.08456938259769237 | {'weight': (10000, 1), 'grad': (10000, 1), 'mom': (10000, 1), 'lr': 0.5, 'rescale_grad': 0.4} |
  394. | signum_update | 0.259269053931348 | 0.2579870051704347 | 0.2646178880240768 | 0.2708843542495743 | {'weight': (10000, 100), 'grad': (10000, 100), 'mom': (10000, 100), 'lr': 0.9, 'rescale_grad': 0.4} |
  395. | sin | 0.814477571984753 | 0.7974489708431065 | 0.8077435952145606 | 1.4279647637158646 | {'data': (1024, 1024)} |
  396. | sin | 0.26866887987125665 | 0.2674704883247614 | 0.27462372090667486 | 0.2832211297936738 | {'data': (10000, 1)} |
  397. | sin | 0.7835786917712539 | 0.7659634866286069 | 0.7770048978272825 | 1.433139368309641 | {'data': (10000, 100)} |
  398. | sinh | 1.8941095017362386 | 1.8819655233528465 | 1.8894329899922013 | 2.5217662681825463 | {'data': (1024, 1024)} |
  399. | sinh | 0.15003525943029672 | 0.14851600280962884 | 0.15858784317970276 | 0.17265255562961118 | {'data': (10000, 1)} |
  400. | sinh | 1.8090908793965355 | 1.7955314833670855 | 1.8048797908704728 | 2.4594668089412157 | {'data': (10000, 100)} |
  401. | size_array | 0.034887269721366465 | 0.03629850107245147 | 0.03757701488211751 | 0.048868522280827165 | {'data': (1024, 1024)} |
  402. | size_array | 0.03679663874208927 | 0.03766396548599005 | 0.038234778912737966 | 0.044336544233374305 | {'data': (10000, 1)} |
  403. | size_array | 0.03659032052382827 | 0.037488003727048635 | 0.03790009650401771 | 0.04107669868972153 | {'data': (10000, 100)} |
  404. | softmax | 1.427406005677767 | 1.4264170022215694 | 1.4368790085427463 | 1.4413486170815304 | {'data': (1024, 1024), 'axis': -1, 'temperature': 0.5} |
  405. | softmax | 0.17845454101916403 | 0.17660498269833624 | 0.18476598197594285 | 0.19874883990269174 | {'data': (10000, 1), 'axis': -1, 'temperature': 0.5} |
  406. | softmax | 1.3585936988238245 | 1.3582954998128116 | 1.3678298040758818 | 1.3877526979194954 | {'data': (10000, 100), 'axis': -1, 'temperature': 0.5} |
  407. | softsign | 0.20246419531758875 | 0.18211250426247716 | 0.1917937013786286 | 0.8556467451853705 | {'data': (1024, 1024)} |
  408. | softsign | 0.14161004510242492 | 0.13996099005453289 | 0.14424497494474053 | 0.1755927462363617 | {'data': (10000, 1)} |
  409. | softsign | 0.19729594932869077 | 0.17589802155271173 | 0.1891649968456477 | 0.8554779971018466 | {'data': (10000, 100)} |
  410. | sort | 22.487551280646585 | 22.282456018729135 | 22.524265991523862 | 27.61729318764992 | {'data': (1024, 1024), 'axis': 0} |
  411. | sort | 0.8646850800141692 | 0.8641070162411779 | 0.8722322236280888 | 0.8853458467638121 | {'data': (10000, 1), 'axis': 0} |
  412. | sort | 16.624957256717607 | 16.57822751440108 | 16.59564939327538 | 17.935966078657664 | {'data': (10000, 100), 'axis': 0} |
  413. | space_to_depth | 0.07427438453305513 | 0.07386048673652112 | 0.07620226824656129 | 0.08837863802909854 | {'data': (1, 4, 2, 4), 'block_size': 2} |
  414. | space_to_depth | 0.25590041012037545 | 0.2543365117162466 | 0.2602819644380361 | 0.2862973435549068 | {'data': (10, 25, 10, 100), 'block_size': 5} |
  415. | sqrt | 0.5817626090720296 | 0.5666694778483361 | 0.5764872650615871 | 1.2220495054498322 | {'data': (1024, 1024)} |
  416. | sqrt | 0.14565934368874878 | 0.14418800128623843 | 0.1517611905001104 | 0.16692153352778422 | {'data': (10000, 1)} |
  417. | sqrt | 0.5559681233717129 | 0.5387470009736717 | 0.5502467858605087 | 1.2332921853521845 | {'data': (10000, 100)} |
  418. | square | 0.20375084830448031 | 0.18280150834470987 | 0.19268248579464856 | 0.8565650711534578 | {'data': (1024, 1024)} |
  419. | square | 0.13866512046661228 | 0.13719697017222643 | 0.14195937546901405 | 0.17822185880504557 | {'data': (10000, 1)} |
  420. | square | 0.19875364087056369 | 0.17649299115873873 | 0.18629412516020238 | 0.8992960228351912 | {'data': (10000, 100)} |
  421. | stop_gradient | 1.2040995701681823 | 1.2032579979859293 | 1.2220540025737137 | 1.2333702930482104 | {'data': (1024, 1024)} |
  422. | stop_gradient | 0.03661728871520609 | 0.03596101305447519 | 0.03662662929855287 | 0.0502844923175872 | {'data': (10000, 1)} |
  423. | stop_gradient | 1.1755091295344755 | 1.1807970295194536 | 1.211533771129325 | 1.215469865128398 | {'data': (10000, 100)} |
  424. | sum | 1.2881833495339379 | 1.2866549950558692 | 1.3004131731577218 | 1.3084662129404023 | {'data': (1024, 1024), 'axis': 0} |
  425. | sum | 0.33686749811749905 | 0.21571601973846555 | 0.22678239620290697 | 0.37194847420329735 | {'data': (10000, 1), 'axis': 0} |
  426. | sum | 1.1355371575336903 | 1.1217534774914384 | 1.1975146364420652 | 1.2145597609924152 | {'data': (10000, 100), 'axis': 0} |
  427. | sum_axis | 0.7223967200843617 | 0.7208095048554242 | 0.731719535542652 | 0.7410854537738487 | {'data': (1024, 1024), 'axis': 0} |
  428. | sum_axis | 0.15999175899196416 | 0.15863249427638948 | 0.16325038741342723 | 0.1834952272474766 | {'data': (10000, 1), 'axis': 0} |
  429. | sum_axis | 0.5440668168012053 | 0.5402109818533063 | 0.5535335862077773 | 0.5668640608200809 | {'data': (10000, 100), 'axis': 0} |
  430. | swapaxes | 0.9924115432659164 | 0.989955005934462 | 1.0007397853769362 | 1.0162075079279023 | {'data': (1024, 1024), 'dim1': 0, 'dim2': 1} |
  431. | swapaxes | 0.07273984316270798 | 0.07225549779832363 | 0.07456080638803542 | 0.08526973484549677 | {'data': (10000, 1), 'dim1': 0, 'dim2': 1} |
  432. | swapaxes | 0.6747546826954931 | 0.667943008011207 | 0.6811622180975974 | 0.6973335595102997 | {'data': (10000, 100), 'dim1': 0, 'dim2': 1} |
  433. | tan | 0.9462300024461001 | 0.9201165230479091 | 0.9627956082113087 | 1.6040336276637392 | {'data': (1024, 1024)} |
  434. | tan | 0.1459797687130049 | 0.14386046677827835 | 0.15028158668428662 | 0.1709019392728808 | {'data': (10000, 1)} |
  435. | tan | 0.9031887154560536 | 0.8793474698904902 | 0.9208405157551169 | 1.5756346081616361 | {'data': (10000, 100)} |
  436. | tanh | 1.212542331777513 | 1.1678790033329278 | 1.1979737086221576 | 1.8882874405244447 | {'data': (1024, 1024)} |
  437. | tanh | 0.14697391190566123 | 0.14421099331229925 | 0.15503690810874104 | 0.1717891352018345 | {'data': (10000, 1)} |
  438. | tanh | 1.1557233601342887 | 1.122691493947059 | 1.2203327962197363 | 1.8952788511523977 | {'data': (10000, 100)} |
  439. | topk | 16.16629035153892 | 15.62795348581858 | 16.079789574723716 | 21.275094599695876 | {'data': (1024, 1024), 'axis': 0, 'k': 1} |
  440. | topk | 0.26486523915082216 | 0.2640694729052484 | 0.271600327687338 | 0.2847644011490048 | {'data': (10000, 1), 'axis': 0, 'k': 1} |
  441. | topk | 12.848319489858113 | 12.81245198333636 | 12.82717392896302 | 13.628345073666436 | {'data': (10000, 100), 'axis': 0, 'k': 1} |
  442. | transpose | 0.451170543092303 | 0.44855347368866205 | 0.4588026145938784 | 0.502436738461256 | {'data': (1024, 1024)} |
  443. | transpose | 0.052988395327702165 | 0.05234251148067415 | 0.055088428780436516 | 0.06395845150109386 | {'data': (10000, 1)} |
  444. | transpose | 0.11369565618224442 | 0.10986448614858091 | 0.11534836958162487 | 0.14422575477510804 | {'data': (10000, 100)} |
  445. | trunc | 0.24715179984923452 | 0.24608153034932911 | 0.25167010026052594 | 0.2611895825248212 | {'data': (1024, 1024)} |
  446. | trunc | 0.08873845275957137 | 0.08789150160737336 | 0.0896796234883368 | 0.10015697916969664 | {'data': (10000, 1)} |
  447. | trunc | 0.23787261627148837 | 0.23694548872299492 | 0.2420982636976987 | 0.25115444324910646 | {'data': (10000, 100)} |
  448. | zeros_like | 0.06554204039275646 | 0.06491554086096585 | 0.06795240333303809 | 0.07773643883410845 | {'data': (1024, 1024)} |
  449. | zeros_like | 0.04205502104014158 | 0.041833496652543545 | 0.042585161281749606 | 0.04864785005338494 | {'data': (10000, 1)} |
  450. | zeros_like | 0.06647260917816311 | 0.06549249519594014 | 0.0683383725117892 | 0.0909782981034369 | {'data': (10000, 100)} |
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement