{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,18]],"date-time":"2025-11-18T12:15:25Z","timestamp":1763468125542},"reference-count":21,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2013,6]]},"DOI":"10.1109\/asap.2013.6567597","type":"proceedings-article","created":{"date-parts":[[2013,8,1]],"date-time":"2013-08-01T20:13:23Z","timestamp":1375388003000},"page":"321-328","source":"Crossref","is-referenced-by-count":4,"title":["GPU acceleration of Data Assembly in Finite Element Methods and its energy implications"],"prefix":"10.1109","author":[{"given":"Li","family":"Tang","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"X. Sharon","family":"Hu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Danny Z.","family":"Chen","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Michael","family":"Niemier","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Richard F.","family":"Barrett","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Simon D.","family":"Hammond","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Genie","family":"Hsieh","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"19","article-title":"Power and performance analysis of GPU-accelerated systems","author":"abe","year":"2012","journal-title":"Hotpower08"},{"key":"17","doi-asserted-by":"publisher","DOI":"10.1145\/2427023.2427027"},{"key":"18","article-title":"High performance parallel jpeg2000 streaming decoder using gpgpu-cpu heterogeneous systempp","author":"le","year":"2012","journal-title":"International Conference on Application-specific Systems Architectures and Processors"},{"key":"15","doi-asserted-by":"publisher","DOI":"10.1002\/cav.24"},{"key":"16","doi-asserted-by":"publisher","DOI":"10.1016\/j.jpdc.2009.01.006"},{"journal-title":"GPU-accelerated Preconditioned Iterative Linear Solvers","year":"2010","author":"li","key":"13"},{"key":"14","first-page":"1","article-title":"Finite element assembly strategies on multi-and many-core architectures","author":"markall","year":"2011","journal-title":"International Journal for Numerical Methods in Fluids"},{"key":"11","first-page":"1","article-title":"3-D parallel conjugate gradient solver optimized for GPUs","author":"carvalho","year":"2010","journal-title":"Proc 14th Biennial IEEE Conf Electromagnetic Field Comp"},{"key":"12","doi-asserted-by":"publisher","DOI":"10.1109\/LMWC.2010.2089974"},{"journal-title":"Dataflow-Driven GPU Performance Projection for Multi-Kernel Transformations","year":"2012","author":"meng","key":"21"},{"journal-title":"Nvidia's Next Generation CUDA Compute Architecture Fermi","year":"2009","key":"3"},{"journal-title":"Summary of Work for ASC L2 Milestone 4465 Characterize the Role of the Mini-Application in Predicting Key Performance Characteristics of Real Applications","year":"2012","author":"barrett","key":"20"},{"journal-title":"Improving Performance Via Mini-applications","year":"2009","author":"heroux","key":"2"},{"year":"0","key":"1"},{"key":"10","doi-asserted-by":"publisher","DOI":"10.1016\/j.jcp.2010.05.023"},{"key":"7","article-title":"Energy-aware high performance computing with graphics processing units","author":"rofouei","year":"2008","journal-title":"Hotpower08"},{"journal-title":"NVIDIA CUDA C Programming Guide","year":"2011","key":"6"},{"key":"5","doi-asserted-by":"publisher","DOI":"10.1002\/nme.2989"},{"journal-title":"NVIDIA's Next Generation CUDA Compute Architecture Kepler GK110","year":"2012","key":"4"},{"journal-title":"VRM 9 0 DC-DC Converter Design Guidelines","year":"2002","key":"9"},{"key":"8","doi-asserted-by":"publisher","DOI":"10.1109\/IPDPS.2009.5160980"}],"event":{"name":"2013 IEEE 24th International Conference on Application-specific Systems, Architectures and Processors (ASAP)","start":{"date-parts":[[2013,6,5]]},"location":"Washington, DC, USA","end":{"date-parts":[[2013,6,7]]}},"container-title":["2013 IEEE 24th International Conference on Application-Specific Systems, Architectures and Processors"],"original-title":[],"link":[{"URL":"https:\/\/summer-heart-0930.chufeiyun1688.workers.dev:443\/http\/xplorestaging.ieee.org\/ielx7\/6558539\/6567524\/06567597.pdf?arnumber=6567597","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2017,3,23]],"date-time":"2017-03-23T03:26:15Z","timestamp":1490239575000},"score":1,"resource":{"primary":{"URL":"https:\/\/summer-heart-0930.chufeiyun1688.workers.dev:443\/http\/ieeexplore.ieee.org\/document\/6567597\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2013,6]]},"references-count":21,"URL":"https:\/\/summer-heart-0930.chufeiyun1688.workers.dev:443\/https\/doi.org\/10.1109\/asap.2013.6567597","relation":{},"subject":[],"published":{"date-parts":[[2013,6]]}}}