SHARE
TWEET

bibs

mahmoodn Aug 14th, 2019 162 Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
  @article{Nickolls08,
    author  = {Nickolls, J. and Buck, I. and Garland, M. and Skadron, K.},
    title   = {Scalable Parallel Programming with {CUDA}},
    journal = {ACM Queue},
    volume  = {6},
    number  = {2},
    year    = {2008},
    pages   = {40--53},
  }
  @article{wen18,
    author  = {Wen, Zeyi and Shi, Jiashuai and Li, Qinbin and He, Bingsheng and Chen, Jian},
    title   = {{ThunderSVM}: A Fast {SVM} Library on {GPUs} and {CPUs}},
    journal = {Journal of Machine Learning Research},
    volume  = {19},
    pages   = {1--5},
    year    = {2018},
  }
  @article{Lindholm08,
    author  = {Lindholm, E. and Nickolls, J. and Oberman, S. and Montrym, J.},
    title   = {{NVIDIA} {Tesla}: A Unified Graphics and Computing Architecture},
    journal = {IEEE Micro},
    volume  = {28},
    number  = {2},
    year    = {2008},
    pages   = {39--55},
  }
  @article{Abraham15,
    author  = {Abraham, M. J. and Murtola, T. and Schulz, R. and Pall, S. and Smith, J. C. and Hess, B. and Lindahl, E.},
    title   = {{GROMACS}: High Performance Molecular Simulations Through Multi-level Parallelism from Laptops to Supercomputers},
    journal = {SoftwareX},
    volume  = {1--2},
    year    = {2015},
    pages   = {19--25},
  }
  @article{Brown12,
    author  = {Brown, W. M. and Kohlmeyer, A. and Plimpton, S. J. and Tharrington, A. N.},
    title   = {Implementing Molecular Dynamics on Hybrid High Performance Computers -- Particle--particle Particle-mesh},
    journal = {Computer Physics Communications},
    volume  = {183},
    number  = {3},
    year    = {2012},
    pages   = {449--459},
  }
  @article{Phillips05,
    author  = {Phillips, J. C. and Braun, R. and Wang, W. and Gumbart, J. and Tajkhorshid, E. and Villa, E. and Chipot, C. and Skeel, R. D. and Kale, L. and Schulten, K.},
    title   = {Scalable Molecular Dynamics with {NAMD}},
    journal = {Journal of Computational Chemistry},
    volume  = {26},
    number  = {16},
    year    = {2005},
    pages   = {1781--1802},
  }
  @article{Wang17,
    author  = {Wang, Y. and Pan, Y. and Davidson, A. and Wu, Y. and Yang, C. and Wang, L. and Osama, M. and Yuan, C. and Liu, W. and Riffel, A. T. and Owens, J. D.},
    title   = {{Gunrock}: {GPU} Graph Analytics},
    journal = {ACM Transactions on Parallel Computing},
    volume  = {4},
    number  = {2},
    year    = {2017},
  }
  @article{Pieters07,
    author  = {Pieters, B. and Van Rijsselbergen, D. and De Neve, W. and Van de Walle, R.},
    title   = {Performance Evaluation of {H.264/AVC} Decoding and Visualization Using the {GPU}},
    journal = {Applications of Digital Image Processing XXX},
    volume  = {6696},
    year    = {2007},
  }
  @article{Chetlur14,
    author        = {Chetlur, S. and Woolley, C. and Vandermersch, P. and Cohen, J. and Tran, J. and Catanzaro, B. and Shelhamer, E.},
    title         = {{cuDNN}: Efficient Primitives for Deep Learning},
    journal       = {arXiv preprint arXiv:1410.0759},
    eprint        = {1410.0759},
    archiveprefix = {arXiv},
    year          = {2014},
  }
  @article{Jorda19,
    author  = {Jorda, M. and Valero-Lara, P. and Pe{\~n}a, A. J.},
    title   = {Performance Evaluation of {cuDNN} Convolution Algorithms on {NVIDIA} {Volta} {GPUs}},
    journal = {IEEE Access},
    volume  = {7},
    number  = {2},
    year    = {2019},
    pages   = {70461--70473},
  }
  83.  
  84.  
  85.  
  86.  
  87.  
  88.  
  89.  
  90.  
  91.  
  @misc{spec,
    title = {{SPEC} {CPU} 2017},
    url   = {https://www.spec.org/cpu2017/},
    note  = {(2018)},
  }
  @misc{xmrig18,
    title = {{XMRig} {NVIDIA} Miner},
    url   = {https://github.com/xmrig/xmrig-nvidia},
    note  = {(2018)},
  }
  @misc{RCSB,
    title = {Research Collaboratory for Structural Bioinformatics ({RCSB})},
    url   = {https://www.rcsb.org/structure/1ao6},
    note  = {(2018)},
  }
  @misc{ffmpeg18,
    title = {{FFmpeg}: A complete, cross-platform solution to record, convert and stream audio and video},
    url   = {https://ffmpeg.org},
    note  = {(2018)},
  }
  @misc{racon19,
    title = {Ultrafast consensus module for raw de novo genome assembly of long uncorrected reads},
    url   = {https://github.com/clara-genomics/racon-gpu},
    note  = {(2019)},
  }
  @misc{thunder19,
    title = {{ThunderSVM}: A Fast {SVM} Library on {GPUs} and {CPUs}},
    url   = {https://github.com/Xtra-Computing/thundersvm},
    note  = {(2019)},
  }
  @misc{bsd,
    title = {The {Berkeley} Segmentation Dataset and Benchmark},
    url   = {https://www2.eecs.berkeley.edu/Research/Projects/CS/vision/bsds},
    note  = {(2019)},
  }
  @misc{optix18,
    title = {{NVIDIA} {OptiX} Ray Tracing Engine},
    url   = {https://developer.nvidia.com/optix},
    note  = {(2018)},
  }
  @misc{advoptix,
    title = {{OptiX} Advanced Samples},
    url   = {https://github.com/nvpro-samples/optix_advanced_samples},
    note  = {(2018)},
  }
  @misc{Nsight18,
    title = {{NVIDIA} {Nsight} {Visual Studio} Edition},
    url   = {https://docs.nvidia.com/gameworks/content/developertools/desktop/analysis/report/cudaexperiments/kernellevel/achievedflops.htm},
    note  = {(2018)},
  }
  @misc{shoc18,
    title = {The {Scalable HeterOgeneous Computing} ({SHOC}) benchmark suite},
    url   = {https://github.com/vetter/shoc},
    note  = {(2018)},
  }
  @misc{3dm,
    title = {The Gamer's Benchmark},
    url   = {https://www.3dmark.com},
    note  = {(2018)},
  }
  @misc{passm,
    title = {Benchmarking \& Diagnostic Software},
    url   = {https://www.passmark.com},
    note  = {(2018)},
  }
  @misc{deepb,
    title = {Benchmarking Deep Learning operations on different hardware},
    url   = {https://github.com/baidu-research/DeepBench},
    note  = {(2018)},
  }
  @misc{mdb,
    title = {{MDBenchmark}: Benchmark molecular dynamics simulations},
    url   = {https://mdbenchmark.readthedocs.io},
    note  = {(2018)},
  }
  @misc{mlperf,
    title = {Fair and useful benchmarks for measuring training and inference performance of {ML} hardware, software, and services},
    url   = {https://mlperf.org},
    note  = {(2019)},
  }
  @misc{skin,
    title = {Skin Segmentation Data Set},
    url   = {https://archive.ics.uci.edu/ml/datasets/skin+segmentation},
    note  = {(2019)},
  }
  177.  
  178.  
  179.  
  @techreport{Stratton12,
    author      = {Stratton, J. A. and Rodrigues, C. and Sung, I. and Obeid, N. and Chang, L. and Anssari, N. and Liu, G. D. and Hwu, W. W.},
    title       = {{Parboil}: A Revised Benchmark Suite for Scientific and Commercial Throughput Computing},
    number      = {IMPACT-12-01},
    institution = {Center for Reliable and High-Performance Computing, University of Illinois at Urbana-Champaign},
    year        = {2012},
  }
  187.  
  188.  
  189.  
  @inproceedings{Ferdman12,
    author    = {Ferdman, M. and Adileh, A. and Kocberber, O. and Volos, S. and Alisafaee, M. and Jevdjic, D. and Kaynak, C. and Popescu, A. D. and Ailamaki, A. and Falsafi, B.},
    title     = {Clearing the Clouds: A Study of Emerging Scale-out Workloads on Modern Hardware},
    booktitle = {Proceedings of Conference on Architectural Support for Programming Languages and Operating Systems},
    year      = {2012},
    pages     = {37--48},
  }
  @inproceedings{Ryoo15,
    author    = {Ryoo, J. H. and Quirem, S. J. and Lebeane, M. and Panda, R. and Song, S. and John, L. K.},
    title     = {{GPGPU} Benchmark Suites: How Well Do They Sample the Performance Spectrum?},
    booktitle = {Proceedings of Conference on Parallel Processing},
    year      = {2015},
    pages     = {320--329},
  }
  @inproceedings{Bienia08,
    author    = {Bienia, C. and Kumar, S. and Singh, J. P. and Li, K.},
    title     = {The {PARSEC} Benchmark Suite: Characterization and Architectural Implications},
    booktitle = {Proceedings of Conference on Parallel Architectures and Compilation Techniques},
    year      = {2008},
    pages     = {72--81},
  }
  @inproceedings{Dev14,
    author    = {Dev, J. A.},
    title     = {{Bitcoin} Mining Acceleration and Performance Quantification},
    booktitle = {Proceedings of Canadian Conference on Electrical and Computer Engineering},
    year      = {2014},
  }
  @inproceedings{Kim14,
    author    = {Kim, Y.},
    title     = {Convolutional Neural Networks for Sentence Classification},
    booktitle = {Proceedings of Conference on Empirical Methods in Natural Language Processing},
    year      = {2014},
    pages     = {1746--1751},
  }
  @inproceedings{Amodei16,
    author    = {Amodei, D. and Anubhai, R. and Battenberg, E. and Case, C. and Casper, J. and Catanzaro, B. and Chen, J. and Chrzanowski, M. and Coates, A. and Diamos, G. and Elsen, E. and Engel, J. and Fan, L. and Fougner, C. and Han, T. and Hannun, A. and Jun, B. and LeGresley, P. and Lin, L. and Narang, S. and Ng, A. and Ozair, S. and Prenger, R. and Raiman, J. and Satheesh, S. and Seetapun, D. and Sengupta, S. and Wang, Y. and Wang, Z. and Wang, C. and Xiao, B. and Yogatama, D. and Zhan, J. and Zhu, Z.},
    title     = {{Deep Speech 2}: End-to-End Speech Recognition in {English} and {Mandarin}},
    booktitle = {Proceedings of Conference on Machine Learning},
    year      = {2016},
    pages     = {173--182},
  }
  @inproceedings{Playne09,
    author    = {Playne, D. P. and Johnson, M. and Hawick, K. A.},
    title     = {Benchmarking {GPU} Devices with {N-Body} Simulations},
    booktitle = {Proceedings of Conference on Computer Design},
    year      = {2009},
    pages     = {150--156},
  }
  @inproceedings{Dong17,
    author    = {Dong, S. and Kaeli, D.},
    title     = {{DNNMark}: A Deep Neural Network Benchmark Suite for {GPUs}},
    booktitle = {Proceedings of the General Purpose GPUs},
    year      = {2017},
    pages     = {63--72},
  }
  @inproceedings{Burtscher12,
    author    = {Burtscher, M. and Nasre, R. and Pingali, K.},
    title     = {A Quantitative Study of Irregular Programs on {GPUs}},
    booktitle = {Proceedings of Symposium on Workload Characterization},
    year      = {2012},
  }
  @inproceedings{Xu14,
    author    = {Xu, Q. and Jeon, H. and Annavaram, M.},
    title     = {Graph Processing on {GPUs}: Where are the Bottlenecks?},
    booktitle = {Proceedings of Symposium on Workload Characterization},
    year      = {2014},
  }
  @inproceedings{Shi16,
    author    = {Shi, S. and Wang, Q. and Xu, P. and Chu, X.},
    title     = {Benchmarking State-of-the-Art Deep Learning Software Tools},
    booktitle = {Proceedings of Conference on Cloud Computing and Big Data},
    year      = {2016},
  }
  @inproceedings{Kulkarni09,
    author    = {Kulkarni, M. and Burtscher, M. and Cascaval, C. and Pingali, K.},
    title     = {{Lonestar}: A Suite of Parallel Irregular Programs},
    booktitle = {Proceedings of Symposium on Performance Analysis of Systems and Software},
    year      = {2009},
  }
  @inproceedings{Volkov10,
    author    = {Volkov, V.},
    title     = {Better Performance at Lower Occupancy},
    booktitle = {Proceedings of the {GPU} Technology Conference},
    year      = {2010},
  }
  @inproceedings{optix10,
    author    = {Parker, S. G.},
    title     = {{OptiX}: A General Purpose Ray Tracing Engine},
    booktitle = {Proceedings of {ACM} {SIGGRAPH}},
    year      = {2010},
    pages     = {66:1--66:13},
  }
  @inproceedings{Chen15,
    author    = {Chen, T. and Li, M. and Li, Y. and Lin, M. and Wang, N. and Wang, M. and Xiao, T. and Xu, B. and Zhang, C. and Zhang, Z.},
    title     = {{MXNet}: A Flexible and Efficient Machine Learning Library for Heterogeneous Distributed Systems},
    booktitle = {Proceedings of Neural Information Processing Systems, Workshop on Machine Learning Systems},
    year      = {2015},
  }
  @inproceedings{Paszke17,
    author    = {Paszke, A. and Gross, S. and Chintala, S. and Chanan, G. and Yang, E. and DeVito, Z. and Lin, Z. and Desmaison, A. and Antiga, L. and Lerer, A.},
    title     = {Automatic Differentiation in {PyTorch}},
    booktitle = {{NIPS} Autodiff Workshop},
    year      = {2017},
  }
  @inproceedings{Abadi16,
    author    = {Abadi, M. and Barham, P. and Chen, J. and Chen, Z. and Davis, A. and Dean, J. and Devin, M. and Ghemawat, S. and Irving, G. and Isard, M. and Kudlur, M. and Levenberg, J. and Monga, R. and Moore, S. and Murray, D. G. and Steiner, B. and Tucker, P. and Vasudevan, V. and Warden, P. and Wicke, M. and Yu, Y. and Zheng, X.},
    title     = {{TensorFlow}: A System for Large-scale Machine Learning},
    booktitle = {Proceedings of {USENIX} conference on Operating Systems Design and Implementation},
    year      = {2016},
    pages     = {265--283},
  }
  @inproceedings{Bakhoda09,
    author    = {Bakhoda, A. and Yuan, G. and Fung, W. and Wong, H. and Aamodt, T. M.},
    title     = {Analyzing {CUDA} Workloads Using a Detailed {GPU} Simulator},
    booktitle = {Proceedings of Symposium on Performance Analysis of Systems and Software},
    year      = {2009},
    pages     = {163--174},
  }
  @inproceedings{Che09,
    author    = {Che, S. and Boyer, M. and Meng, J. and Tarjan, D. and Sheaffer, J. W. and Lee, S.-H. and Skadron, K.},
    title     = {{Rodinia}: A Benchmark Suite for Heterogeneous Computing},
    booktitle = {Proceedings of Symposium on Workload Characterization},
    year      = {2009},
    pages     = {44--54},
  }
  @inproceedings{Shi16b,
    author    = {Shi, W. and Caballero, J. and Husz{\'a}r, F. and Totz, J. and Aitken, A. P. and Bishop, R. and Rueckert, D. and Wang, Z.},
    title     = {Real-Time Single Image and Video Super-Resolution Using an Efficient Sub-Pixel Convolutional Neural Network},
    booktitle = {Proceedings of Conference on Computer Vision and Pattern Recognition},
    year      = {2016},
    pages     = {1874--1883},
  }
  @inproceedings{Volkov08,
    author    = {Volkov, V. and Demmel, J. W.},
    title     = {Benchmarking {GPUs} to Tune Dense Linear Algebra},
    booktitle = {Proceedings of International Conference on Supercomputing},
    year      = {2008},
    pages     = {1--11},
  }
  @inproceedings{Xu16,
    author    = {Xu, Y. and Wang, R. and Li, T. and Song, M. and Gao, L. and Luan, Z. and Qian, D.},
    title     = {Scheduling Tasks with Mixed Timing Constraints in {GPU-Powered} Real-Time Systems},
    booktitle = {Proceedings of Conference on Supercomputing},
    year      = {2016},
  }
  @inproceedings{Ravi11,
    author    = {Ravi, V. T. and Becchi, M. and Agrawal, G. and Chakradhar, S.},
    title     = {Supporting {GPU} Sharing in Cloud Environments with a Transparent Runtime Consolidation Framework},
    booktitle = {Proceedings of Symposium on High Performance Distributed Computing},
    year      = {2011},
    pages     = {217--228},
  }
  @inproceedings{Li15,
    author    = {Li, P. and Luo, Y. and Zhang, N. and Cao, Y.},
    title     = {{HeteroSpark}: A Heterogeneous {CPU/GPU} {Spark} Platform for Machine Learning Algorithms},
    booktitle = {Proceedings of Conference on Networking, Architecture and Storage},
    year      = {2015},
    pages     = {347--348},
  }
  @inproceedings{Cui16,
    author    = {Cui, H. and Zhang, H. and Ganger, G. R. and Gibbons, P. B. and Xing, E. P.},
    title     = {{GeePS}: scalable deep learning on distributed {GPUs} with a {GPU}-specialized parameter server},
    booktitle = {Proceedings of European Conference on Computer Systems},
    year      = {2016},
  }
RAW Paste Data
We use cookies for various purposes including analytics. By continuing to use Pastebin, you agree to our use of cookies as described in the Cookies Policy. OK, I Understand
Not a member of Pastebin yet?
Sign Up, it unlocks many cool features!
 
Top