{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,2,21]],"date-time":"2025-02-21T00:50:28Z","timestamp":1740099028638,"version":"3.37.3"},"publisher-location":"Cham","reference-count":18,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783319733524"},{"type":"electronic","value":"9783319733531"}],"license":[{"start":{"date-parts":[[2017,12,28]],"date-time":"2017-12-28T00:00:00Z","timestamp":1514419200000},"content-version":"unspecified","delay-in-days":0,"URL":"https:\/\/2.zoppoz.workers.dev:443\/http\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018]]},"DOI":"10.1007\/978-3-319-73353-1_5","type":"book-chapter","created":{"date-parts":[[2017,12,27]],"date-time":"2017-12-27T05:45:34Z","timestamp":1514353534000},"page":"71-86","update-policy":"https:\/\/2.zoppoz.workers.dev:443\/https\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["Analysis and Characterization of GPU Benchmarks for Kernel Concurrency Efficiency"],"prefix":"10.1007","author":[{"given":"Pablo","family":"Carvalho","sequence":"first","affiliation":[]},{"given":"L\u00facia M. A.","family":"Drummond","sequence":"additional","affiliation":[]},{"given":"Cristiana","family":"Bentes","sequence":"additional","affiliation":[]},{"given":"Esteban","family":"Clua","sequence":"additional","affiliation":[]},{"given":"Edson","family":"Cataldo","sequence":"additional","affiliation":[]},{"given":"Leandro A. J.","family":"Marzulo","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2017,12,28]]},"reference":[{"key":"5_CR1","doi-asserted-by":"crossref","unstructured":"Che, S., Boyer, M., Meng, J., Tarjan, D., Sheaffer, J.W., Lee, S.-H., Skadron, K.: Rodinia: a benchmark suite for heterogeneous computing. In: Proceedings of the IEEE International Symposium on Workload Characterization (IISWC), pp. 44\u201354 (2009)","DOI":"10.1109\/IISWC.2009.5306797"},{"key":"5_CR2","unstructured":"Stratton, J.A., Rodrigues, C., Sung, I.-J., Obeid, N., Chang, L.-W., Anssari, N., Liu, G.D., Hwu, W.M.W.: Parboil: a revised benchmark suite for scientific and commercial throughput computing (2012)"},{"key":"5_CR3","doi-asserted-by":"crossref","unstructured":"Danalis, A., Marin, G., McCurdy, C., Meredith, J.S., Roth, P.C., Spafford, K., Tipparaju, V., Vetter, J.S.: The scalable heterogeneous computing (SHOC) benchmark suite. In: Proceedings of the 3rd Workshop on General-Purpose Computation on Graphics Processing Units, pp. 63\u201374 (2010)","DOI":"10.1145\/1735688.1735702"},{"key":"5_CR4","doi-asserted-by":"crossref","unstructured":"Pai, S., Thazhuthaveetil, M.J., Govindarajan, R.: Improving GPGPU concurrency with elastic kernels. In: ACM SIGPLAN Notices, vol. 48, pp. 407\u2013418. ACM (2013)","DOI":"10.1145\/2451116.2451160"},{"key":"5_CR5","doi-asserted-by":"crossref","unstructured":"Che, S., Sheaffer, J.W., Boyer, M., Szafaryn, L.G., Wang, L., Skadron, K.: A characterization of the Rodinia benchmark suite with comparison to contemporary CMP workloads. In: Proceedings of the IEEE International Symposium on Workload Characterization (2010)","DOI":"10.1109\/IISWC.2010.5650274"},{"key":"5_CR6","doi-asserted-by":"crossref","unstructured":"Kerr, A., Diamos, G., Yalamanchili, S.: A characterization and analysis of PTX kernels. In: IEEE International Symposium on Workload Characterization, IISWC 2009, pp. 3\u201312. IEEE (2009)","DOI":"10.1109\/IISWC.2009.5306801"},{"key":"5_CR7","doi-asserted-by":"crossref","unstructured":"Goswami, N., Shankar, R., Joshi, M., Li, T.: Exploring GPGPU workloads: characterization methodology, analysis and microarchitecture evaluation implications. In: 2010 IEEE International Symposium on Workload Characterization (IISWC), pp. 1\u201310. IEEE (2010)","DOI":"10.1109\/IISWC.2010.5649549"},{"key":"5_CR8","doi-asserted-by":"crossref","unstructured":"Burtscher, M., Nasre, R., Pingali, K.: A quantitative study of irregular programs on GPUs. In: 2012 IEEE International Symposium on Workload Characterization (IISWC), pp. 141\u2013151. IEEE (2012)","DOI":"10.1109\/IISWC.2012.6402918"},{"key":"5_CR9","doi-asserted-by":"crossref","unstructured":"O\u2019Neil, M.A., Burtscher, M.: Microarchitectural performance characterization of irregular GPU kernels. In: 2014 IEEE International Symposium on Workload Characterization (IISWC), pp. 130\u2013139. IEEE (2014)","DOI":"10.1109\/IISWC.2014.6983052"},{"key":"5_CR10","doi-asserted-by":"crossref","unstructured":"Bakhoda, A., Yuan, G.L., Fung, W.W., Wong, H., Aamodt, T.M.: Analyzing CUDA workloads using a detailed GPU simulator. In: IEEE International Symposium on Performance Analysis of Systems and Software, ISPASS 2009, pp. 163\u2013174. IEEE (2009)","DOI":"10.1109\/ISPASS.2009.4919648"},{"key":"5_CR11","volume-title":"Benchmarking Modern Multiprocessors","author":"C Bienia","year":"2011","unstructured":"Bienia, C.: Benchmarking Modern Multiprocessors. Princeton University, Princeton (2011)"},{"key":"5_CR12","unstructured":"Asanovic, K.: The landscape of parallel computing research: a view from Berkeley, Technical report UCB\/EECS-2006-183, EECS Department, University of California, Berkley, CA, USA (2006)"},{"key":"5_CR13","unstructured":"SHOC (2012). \nhttps:\/\/2.zoppoz.workers.dev:443\/https\/github.com\/vetter\/shoc\/wiki"},{"key":"5_CR14","unstructured":"NVIDIA Corporation: Profiler user\u2019s guide (2017). \nhttps:\/\/2.zoppoz.workers.dev:443\/http\/docs.nvidia.com\/cuda\/profiler-users-guide\/index.html#nvprof-overview\n\n, an optional note"},{"key":"5_CR15","unstructured":"Bienia, C.: Benchmarking modern multiprocessors, Ph.D. thesis, Princeton University (2011)"},{"issue":"6","key":"5_CR16","doi-asserted-by":"crossref","first-page":"769","DOI":"10.1109\/TC.2006.85","volume":"55","author":"A Joshi","year":"2006","unstructured":"Joshi, A., Phansalkar, A., Eeckhout, L., John, L.K.: Measuring benchmark similarity using inherent program characteristics. IEEE Trans. Comput. 55(6), 769\u2013782 (2006)","journal-title":"IEEE Trans. Comput."},{"issue":"2","key":"5_CR17","doi-asserted-by":"crossref","first-page":"238","DOI":"10.1177\/1094342013507960","volume":"28","author":"S Che","year":"2014","unstructured":"Che, S., Skadron, K.: Benchfriend: correlating the performance of GPU benchmarks. Int. J. High Perform. Comput. Appl. 28(2), 238\u2013250 (2014)","journal-title":"Int. J. High Perform. Comput. Appl."},{"key":"5_CR18","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"122","DOI":"10.1007\/978-3-642-14122-5_16","volume-title":"Euro-Par 2009 \u2013 Parallel Processing Workshops","author":"K Spafford","year":"2010","unstructured":"Spafford, K., Meredith, J., Vetter, J., Chen, J., Grout, R., Sankaran, R.: Accelerating S3D: a GPGPU case study. In: Lin, H.-X., Alexander, M., Forsell, M., Kn\u00fcpfer, A., Prodan, R., Sousa, L., Streit, A. (eds.) Euro-Par 2009. LNCS, vol. 6043, pp. 122\u2013131. Springer, Heidelberg (2010). \nhttps:\/\/2.zoppoz.workers.dev:443\/https\/doi.org\/10.1007\/978-3-642-14122-5_16"}],"container-title":["Communications in Computer and Information Science","High Performance Computing"],"original-title":[],"link":[{"URL":"https:\/\/2.zoppoz.workers.dev:443\/http\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-73353-1_5","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2017,12,27]],"date-time":"2017-12-27T05:49:59Z","timestamp":1514353799000},"score":1,"resource":{"primary":{"URL":"https:\/\/2.zoppoz.workers.dev:443\/http\/link.springer.com\/10.1007\/978-3-319-73353-1_5"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017,12,28]]},"ISBN":["9783319733524","9783319733531"],"references-count":18,"URL":"https:\/\/2.zoppoz.workers.dev:443\/https\/doi.org\/10.1007\/978-3-319-73353-1_5","relation":{},"ISSN":["1865-0929","1865-0937"],"issn-type":[{"type":"print","value":"1865-0929"},{"type":"electronic","value":"1865-0937"}],"subject":[],"published":{"date-parts":[[2017,12,28]]}}}