{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,19]],"date-time":"2026-02-19T02:19:15Z","timestamp":1771467555298,"version":"3.50.1"},"reference-count":47,"publisher":"IEEE","license":[{"start":{"date-parts":[[2019,1,1]],"date-time":"2019-01-01T00:00:00Z","timestamp":1546300800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/summer-heart-0930.chufeiyun1688.workers.dev:443\/https\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2019,1,1]],"date-time":"2019-01-01T00:00:00Z","timestamp":1546300800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/summer-heart-0930.chufeiyun1688.workers.dev:443\/https\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2019,1,1]],"date-time":"2019-01-01T00:00:00Z","timestamp":1546300800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/summer-heart-0930.chufeiyun1688.workers.dev:443\/https\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2019,1]]},"DOI":"10.1109\/wacv.2019.00015","type":"proceedings-article","created":{"date-parts":[[2019,3,7]],"date-time":"2019-03-07T19:19:06Z","timestamp":1551986346000},"page":"71-80","source":"Crossref","is-referenced-by-count":32,"title":["Where to Focus on for Human Action Recognition?"],"prefix":"10.1109","author":[{"given":"Srijan","family":"Das","sequence":"first","affiliation":[]},{"given":"Arpit","family":"Chaudhary","sequence":"additional","affiliation":[]},{"given":"Francois","family":"Bremond","sequence":"additional","affiliation":[]},{"given":"Monique","family":"Thonnat","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.683"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.510"},{"key":"ref33","first-page":"1","article-title":"Deep multimodal feature analysis for action recognition in rgb+d videos","author":"shahroudy","year":"2017","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.115"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.167"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298860"},{"key":"ref37","volume":"12","author":"soomro","year":"2012","journal-title":"Ucf101 A Dataset of 101 Human Actions Classes from Videos in the Wild"},{"key":"ref36","first-page":"4263","article-title":"An end-to-end spatio-temporal attention model for human action recognition from skeleton data","author":"song","year":"2017","journal-title":"AAAI Conference on Artificial Intelligence"},{"key":"ref35","first-page":"568","article-title":"Two-stream convolutional networks for action recognition in videos","author":"simonyan","year":"2014","journal-title":"Advances in neural information processing systems"},{"key":"ref34","article-title":"Action recognition using visual attention","author":"sharma","year":"2015"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.213"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2011.5995407"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/ICPR.2014.772"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.333"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1162\/neco.1997.9.8.1735"},{"key":"ref14","first-page":"5","volume":"1","author":"hogg","year":"1983","journal-title":"Model-based Vision A Program to See a Walking Person Image and Vision Computing"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7299172"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2016.2640292"},{"key":"ref17","article-title":"Adam: A method for stochastic optimization","author":"kingma","year":"2014","journal-title":"CoRR abs\/1412 6980"},{"key":"ref18","article-title":"Imagenet classification with deep convolutional neural networks","author":"krizhevsky","year":"2012","journal-title":"NIPS"},{"key":"ref19","first-page":"1","article-title":"Learning realistic human actions from movies","author":"laptev","year":"2008","journal-title":"Computer Vision and Pattern Recognition 2008 CVPR 2008 IEEE Conference"},{"key":"ref28","first-page":"143","article-title":"Improving the fisher kernel for large-scale image classification","author":"perronnin","year":"2010","journal-title":"European Conference on Computer Vision"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.502"},{"key":"ref27","first-page":"2204","article-title":"Recurrent models of visual attention","volume":"2","author":"mnih","year":"2014","journal-title":"Proceedings of the 27th International Conference on Neural Information Processing Systems"},{"key":"ref3","article-title":"Glimpse clouds: Human activity recognition from unstructured feature points","author":"baradel","year":"2018","journal-title":"The IEEE Conference on Computer Vision and Pattern Recognition (CVPR)"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.368"},{"key":"ref29","first-page":"588","article-title":"Human action recognition by representing 3d skeletons as points in a lie group","author":"v r","year":"2014","journal-title":"2014 IEEE Conference on Computer Vision and Pattern Recognition"},{"key":"ref5","article-title":"Return of the devil in the details: Delving deep into convolutional nets","author":"chatfield","year":"2014","journal-title":"British Machine Vision Conference"},{"key":"ref8","article-title":"A Fusion of Appearance based CNNs and Temporal evolution of Skeleton with LSTM for Daily Living Action Recognition","author":"das","year":"2018","journal-title":"ArXiv e-prints"},{"key":"ref7","author":"chollet","year":"2015","journal-title":"Keras"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCVW.2017.77"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298878"},{"key":"ref1","author":"abadi","year":"2015","journal-title":"TensorFlow Large-Scale Machine Learning on Heterogeneous Systems"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2013.347"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.115"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1109\/WACV.2017.24"},{"key":"ref22","first-page":"2855","article-title":"Discriminative virtual views for cross-view action recognition","author":"li","year":"2012","journal-title":"2012 IEEE Conference on Computer Vision and Pattern Recognition"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.316"},{"key":"ref21","first-page":"1362","article-title":"Cross-view activity recognition using hankelets","author":"li","year":"2012","journal-title":"2012 IEEE Conference on Computer Vision and Pattern Recognition"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1016\/j.knosys.2018.05.029"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.391"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.339"},{"key":"ref23","doi-asserted-by":"crossref","first-page":"816","DOI":"10.1007\/978-3-319-46487-9_50","article-title":"Spatio-temporal lstm with trust gates for 3d human action recognition","author":"liu","year":"2016","journal-title":"editors Computer Vision - ECCV 2016"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.233"},{"key":"ref26","article-title":"Recognizing human actions as the evolution of pose estimation maps","author":"liu","year":"2018","journal-title":"The IEEE Conference on Computer Vision and Pattern Recognition (CVPR)"},{"key":"ref43","article-title":"End-to-end learning of action detection from frame glimpses in videos","author":"yeung","year":"2015"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2017.02.030"}],"event":{"name":"2019 IEEE Winter Conference on Applications of Computer Vision (WACV)","location":"Waikoloa Village, HI, USA","start":{"date-parts":[[2019,1,7]]},"end":{"date-parts":[[2019,1,11]]}},"container-title":["2019 IEEE Winter Conference on Applications of Computer Vision (WACV)"],"original-title":[],"link":[{"URL":"https:\/\/summer-heart-0930.chufeiyun1688.workers.dev:443\/http\/xplorestaging.ieee.org\/ielx7\/8642793\/8658235\/08658564.pdf?arnumber=8658564","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,7,19]],"date-time":"2022-07-19T16:23:43Z","timestamp":1658247823000},"score":1,"resource":{"primary":{"URL":"https:\/\/summer-heart-0930.chufeiyun1688.workers.dev:443\/https\/ieeexplore.ieee.org\/document\/8658564\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019,1]]},"references-count":47,"URL":"https:\/\/summer-heart-0930.chufeiyun1688.workers.dev:443\/https\/doi.org\/10.1109\/wacv.2019.00015","relation":{},"subject":[],"published":{"date-parts":[[2019,1]]}}}