{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,26]],"date-time":"2026-06-26T05:35:11Z","timestamp":1782452111844,"version":"3.54.5"},"reference-count":23,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"2","license":[{"start":{"date-parts":[[1994,3,1]],"date-time":"1994-03-01T00:00:00Z","timestamp":762480000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/summer-heart-0930.chufeiyun1688.workers.dev:443\/https\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Neural Netw."],"published-print":{"date-parts":[[1994,3]]},"DOI":"10.1109\/72.279181","type":"journal-article","created":{"date-parts":[[2002,8,24]],"date-time":"2002-08-24T19:16:32Z","timestamp":1030216592000},"page":"157-166","source":"Crossref","is-referenced-by-count":6684,"title":["Learning long-term dependencies with gradient descent is difficult"],"prefix":"10.1109","volume":"5","author":[{"given":"Y.","family":"Bengio","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"P.","family":"Simard","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"P.","family":"Frasconi","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"263","reference":[{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/IJCNN.1989.118276"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/NNSP.1992.253712"},{"key":"ref12","first-page":"73","article-title":"Learning by choice of internal representation","volume":"1","author":"grossman","year":"0","journal-title":"Neural Information Processing Systems"},{"key":"ref13","doi-asserted-by":"crossref","first-page":"671","DOI":"10.1126\/science.220.4598.671","article-title":"Optimization by simulated annealing","volume":"220","author":"kirkpatrick","year":"1983","journal-title":"Science"},{"key":"ref14","author":"kuhn","year":"1987","journal-title":"A first look at phonetic discrimination using connectionist models with recurrent links"},{"key":"ref15","author":"lang","year":"1988","journal-title":"The development of the time-delay neural network architecture for speech recognition"},{"key":"ref16","doi-asserted-by":"crossref","first-page":"233","DOI":"10.1007\/978-3-642-82657-3_24","author":"le cun","year":"1986","journal-title":"Disordered Systems and Biological Organization"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1016\/0167-2789(91)90236-3"},{"key":"ref18","first-page":"349","article-title":"A focused back-propagation algorithm for temporal pattern recognition","volume":"3","author":"mozer","year":"1989","journal-title":"Complex Systems"},{"key":"ref19","first-page":"275","volume":"4","author":"mozer","year":"1992","journal-title":"Advances in neural information processing systems"},{"key":"ref4","author":"bengio","year":"1991","journal-title":"Artificial neural networks and their application to sequence recognition"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/ICNN.1993.298725"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1145\/29380.29864"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/72.125866"},{"key":"ref8","article-title":"Unified integration of explicit rules and learning by example in recurrent networks","author":"frasconi","year":"0","journal-title":"IEEE Trans on Knowledge and Data Engineering"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1162\/neco.1992.4.1.120"},{"key":"ref2","first-page":"29","article-title":"Improving the convergence of backpropagation learning with second order methods","author":"becker","year":"0","journal-title":"Proceedings of the 1988 Connectionist Models Summer School"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/72.125861"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/ICNN.1993.298832"},{"key":"ref20","author":"ortega","year":"1960","journal-title":"Iterative Solution of Non-linear Equations in Several Variables and Systems of Equations"},{"key":"ref22","first-page":"318","volume":"1","author":"rumelhart","year":"1986","journal-title":"Parallel Distributed Processing"},{"key":"ref21","first-page":"558","volume":"2","author":"rohwer","year":"1990","journal-title":"Advances in neural information processing systems"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1162\/neco.1989.1.2.270"}],"container-title":["IEEE Transactions on Neural Networks"],"original-title":[],"link":[{"URL":"https:\/\/summer-heart-0930.chufeiyun1688.workers.dev:443\/http\/xplorestaging.ieee.org\/ielx4\/72\/6922\/00279181.pdf?arnumber=279181","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,11,29]],"date-time":"2021-11-29T20:14:03Z","timestamp":1638216843000},"score":1,"resource":{"primary":{"URL":"https:\/\/summer-heart-0930.chufeiyun1688.workers.dev:443\/https\/ieeexplore.ieee.org\/document\/279181\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[1994,3]]},"references-count":23,"journal-issue":{"issue":"2"},"URL":"https:\/\/summer-heart-0930.chufeiyun1688.workers.dev:443\/https\/doi.org\/10.1109\/72.279181","relation":{},"ISSN":["1045-9227","1941-0093"],"issn-type":[{"value":"1045-9227","type":"print"},{"value":"1941-0093","type":"electronic"}],"subject":[],"published":{"date-parts":[[1994,3]]}}}