{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,8,2]],"date-time":"2025-08-02T19:01:30Z","timestamp":1754161290921,"version":"3.41.2"},"publisher-location":"New York, NY, USA","reference-count":39,"publisher":"ACM","content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,6,23]]},"DOI":"10.1145\/3696630.3728496","type":"proceedings-article","created":{"date-parts":[[2025,7,28]],"date-time":"2025-07-28T19:10:43Z","timestamp":1753729843000},"page":"545-549","update-policy":"https:\/\/summer-heart-0930.chufeiyun1688.workers.dev:443\/https\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Reduction Fusion for Optimized Distributed Data-Parallel Computations via Inverse Recomputation"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/summer-heart-0930.chufeiyun1688.workers.dev:443\/https\/orcid.org\/0000-0002-9148-5861","authenticated-orcid":false,"given":"Haoxiang","family":"Lin","sequence":"first","affiliation":[{"name":"Microsoft Research, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/summer-heart-0930.chufeiyun1688.workers.dev:443\/https\/orcid.org\/0000-0001-7322-4062","authenticated-orcid":false,"given":"Yang","family":"Wang","sequence":"additional","affiliation":[{"name":"Microsoft Research, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/summer-heart-0930.chufeiyun1688.workers.dev:443\/https\/orcid.org\/0000-0003-1899-8561","authenticated-orcid":false,"given":"Yanjie","family":"Gao","sequence":"additional","affiliation":[{"name":"Microsoft Research, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/summer-heart-0930.chufeiyun1688.workers.dev:443\/https\/orcid.org\/0000-0002-3063-9425","authenticated-orcid":false,"given":"Hongyu","family":"Zhang","sequence":"additional","affiliation":[{"name":"Chongqing University, Chongqing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/summer-heart-0930.chufeiyun1688.workers.dev:443\/https\/orcid.org\/0009-0001-6663-4861","authenticated-orcid":false,"given":"Ming","family":"Wu","sequence":"additional","affiliation":[{"name":"Zero Gravity Labs, San Francisco, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/summer-heart-0930.chufeiyun1688.workers.dev:443\/https\/orcid.org\/0009-0009-6455-3898","authenticated-orcid":false,"given":"Mao","family":"Yang","sequence":"additional","affiliation":[{"name":"Microsoft Research, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2025,7,28]]},"reference":[{"key":"e_1_3_2_1_1_1","volume-title":"Proceedings of the 2022 International Conference on Management of Data","author":"Abeysinghe Supun","year":"2022","unstructured":"Supun Abeysinghe, Qiyang He, and Tiark Rompf. 2022. Efficient Incrementialization of Correlated Nested Aggregate Queries using Relative Partial Aggregate Indexes (RPAI). In Proceedings of the 2022 International Conference on Management of Data (Philadelphia, PA, USA) (SIGMOD '22). Association for Computing Machinery, New York, NY, USA, 136\u2013149. 10.1145\/3514221.3517889"},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.1145\/3416510"},{"key":"e_1_3_2_1_3_1","volume-title":"Proceedings of the 8th USENIX Conference on Operating Systems Design and Implementation","author":"Cadar Cristian","year":"2008","unstructured":"Cristian Cadar, Daniel Dunbar, and Dawson Engler. 2008. KLEE: unassisted and automatic generation of high-coverage tests for complex systems programs. In Proceedings of the 8th USENIX Conference on Operating Systems Design and Implementation (San Diego, California) (OSDI'08). USENIX Association, USA, 209\u2013224."},{"key":"e_1_3_2_1_4_1","volume-title":"Apache Hive: From MapReduce to Enterprise-grade Big Data Warehousing. CoRR abs\/1903.10970","author":"Camacho-Rodr\u00edguez Jes\u00fas","year":"2019","unstructured":"Jes\u00fas Camacho-Rodr\u00edguez, Ashutosh Chauhan, Alan Gates, Eugene Koifman, Owen O'Malley, Vineet Garg, Zoltan Haindrich, Sergey Shelukhin, Prasanth Jayachandran, Siddharth Seth, Deepak Jaiswal, Slim Bouguerra, Nishant Bangarwa, Sankar Hariappan, Anishek Agarwal, Jason Dere, Daniel Dai, Thejas Nair, Nita Dembla, Gopal Vijayaraghavan, and G\u00fcnther Hagleitner. 2019. Apache Hive: From MapReduce to Enterprise-grade Big Data Warehousing. CoRR abs\/1903.10970 (2019). arXiv:1903.10970"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.14778\/1454159.1454166"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1016\/0167-6423(90)90042-C"},{"key":"e_1_3_2_1_7_1","volume-title":"Proceedings of the 36th International Conference on Neural Information Processing Systems","author":"Dao Tri","year":"2024","unstructured":"Tri Dao, Daniel Y. Fu, Stefano Ermon, Atri Rudra, and Christopher R\u00e9. 2024. FLASHATTENTION: fast and memory-efficient exact attention with IO-awareness. In Proceedings of the 36th International Conference on Neural Information Processing Systems (New Orleans, LA, USA) (NIPS '22). Curran Associates Inc., Red Hook, NY, USA, Article 1189, 16 pages."},{"key":"e_1_3_2_1_8_1","volume-title":"Proceedings of the Theory and Practice of Software, 14th International Conference on Tools and Algorithms for the Construction and Analysis of Systems","author":"Moura Leonardo De","year":"2008","unstructured":"Leonardo De Moura and Nikolaj Bj\u00f8rner. 2008. Z3: An Efficient SMT Solver. In Proceedings of the Theory and Practice of Software, 14th International Conference on Tools and Algorithms for the Construction and Analysis of Systems (Budapest, Hungary) (TACAS '08\/ETAPS '08). Springer-Verlag, Berlin, Heidelberg, 337\u2013340."},{"key":"e_1_3_2_1_9_1","volume-title":"Proceedings of the 19th International Conference on Computer Aided Verification","author":"de Moura Leonardo","year":"2007","unstructured":"Leonardo de Moura, Bruno Dutertre, and Natarajan Shankar. 2007. A Tutorial on Satisfiability modulo Theories. In Proceedings of the 19th International Conference on Computer Aided Verification (Berlin, Germany) (CAV '07). Springer-Verlag, Berlin, Heidelberg, 20\u201336."},{"key":"e_1_3_2_1_10_1","volume-title":"MapReduce: Simplified Data Processing on Large Clusters. In OSDI'04: Sixth Symposium on Operating System Design and Implementation","author":"Dean Jeffrey","year":"2004","unstructured":"Jeffrey Dean and Sanjay Ghemawat. 2004. MapReduce: Simplified Data Processing on Large Clusters. In OSDI'04: Sixth Symposium on Operating System Design and Implementation. San Francisco, CA, 137\u2013150."},{"key":"e_1_3_2_1_11_1","volume-title":"Graph Theory","author":"Diestel Reinhard","unstructured":"Reinhard Diestel. 2017. Graph Theory (5th ed.). Springer Publishing Company, Incorporated.","edition":"5"},{"key":"e_1_3_2_1_12_1","volume-title":"Proceedings of the Eleventh Workshop on Language Descriptions, Tools and Applications","author":"Dom\u00ednguez Facundo","year":"2011","unstructured":"Facundo Dom\u00ednguez and Alberto Pardo. 2011. Exploiting algebra\/coalgebra duality for program fusion extensions. In Proceedings of the Eleventh Workshop on Language Descriptions, Tools and Applications (Saarbrucken, Germany) (LDTA '11). Association for Computing Machinery, New York, NY, USA, Article 6, 8 pages. 10.1145\/1988783.1988789"},{"volume-title":"Elements of Set Theory","author":"Enderton Herbert B.","key":"e_1_3_2_1_13_1","unstructured":"Herbert B. Enderton. 1977. Elements of Set Theory. Academic Press, San Diego."},{"volume-title":"Deep Learning","author":"Goodfellow Ian","key":"e_1_3_2_1_14_1","unstructured":"Ian Goodfellow, Yoshua Bengio, and Aaron Courville. 2016. Deep Learning. MIT Press. https:\/\/summer-heart-0930.chufeiyun1688.workers.dev:443\/http\/www.deeplearningbook.org."},{"key":"e_1_3_2_1_15_1","volume-title":"10th USENIX Symposium on Operating Systems Design and Implementation (OSDI 12)","author":"Guo Zhenyu","year":"2012","unstructured":"Zhenyu Guo, Xuepeng Fan, Rishan Chen, Jiaxing Zhang, Hucheng Zhou, Sean McDirmid, Chang Liu, Wei Lin, Jingren Zhou, and Lidong Zhou. 2012. Spotting Code Optimizations in Data-Parallel Pipelines through PeriSCOPE. In 10th USENIX Symposium on Operating Systems Design and Implementation (OSDI 12). USENIX Association, Hollywood, CA, 121\u2013133. https:\/\/summer-heart-0930.chufeiyun1688.workers.dev:443\/https\/www.usenix.org\/conference\/osdi12\/technical-sessions\/presentation\/guo"},{"key":"e_1_3_2_1_16_1","volume-title":"Proceedings of the 38th ACM SIGPLAN Conference on Programming Language Design and Implementation","author":"Hu Qinheping","year":"2017","unstructured":"Qinheping Hu and Loris D'Antoni. 2017. Automatic program inversion using symbolic transducers. In Proceedings of the 38th ACM SIGPLAN Conference on Programming Language Design and Implementation (Barcelona, Spain) (PLDI 2017). Association for Computing Machinery, New York, NY, USA, 376\u2013389. 10.1145\/3062341.3062345"},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1017\/S0956796899003500"},{"key":"e_1_3_2_1_18_1","volume-title":"Proceedings of the 32nd ACM International Conference on Information and Knowledge Management","author":"Jang Myung-Hwan","year":"2023","unstructured":"Myung-Hwan Jang, Yunyong Ko, Hyuck-Moo Gwon, Ikhyeon Jo, Yongjun Park, and Sang-Wook Kim. 2023. SAGE: A Storage-Based Approach for Scalable and Efficient Sparse Generalized Matrix-Matrix Multiplication. In Proceedings of the 32nd ACM International Conference on Information and Knowledge Management (Birmingham, United Kingdom) (CIKM '23). Association for Computing Machinery, New York, NY, USA, 923\u2013933. 10.1145\/3583780.3615044"},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.1145\/340855.340964"},{"key":"e_1_3_2_1_20_1","volume-title":"Allen","author":"Kennedy Ken","year":"2001","unstructured":"Ken Kennedy and John R. Allen. 2001. Optimizing compilers for modern architectures: a dependence-based approach. Morgan Kaufmann Publishers Inc., San Francisco, CA, USA."},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.1145\/360248.360252"},{"key":"e_1_3_2_1_22_1","volume-title":"Proceedings of the ACM Symposium on Cloud Computing","author":"Liu Chang","year":"2014","unstructured":"Chang Liu, Jiaxing Zhang, Hucheng Zhou, Sean McDirmid, Zhenyu Guo, and Thomas Moscibroda. 2014. Automating Distributed Partial Aggregation. In Proceedings of the ACM Symposium on Cloud Computing (Seattle, WA, USA) (SOCC '14). Association for Computing Machinery, New York, NY, USA, 1\u201312. 10.1145\/2670979.2670980"},{"key":"e_1_3_2_1_23_1","volume-title":"Proceedings of the 28th ACM Joint Meeting on European Software Engineering Conference and Symposium on the Foundations of Software Engineering","author":"Liu Yu","year":"2020","unstructured":"Yu Liu, Cheng Chen, Ru Zhang, Tingting Qin, Xiang Ji, Haoxiang Lin, and Mao Yang. 2020. Enhancing the Interoperability between Deep Learning Frameworks by Model Conversion. In Proceedings of the 28th ACM Joint Meeting on European Software Engineering Conference and Symposium on the Foundations of Software Engineering (Virtual Event, USA) (ESEC\/FSE 2020). Association for Computing Machinery, New York, NY, USA, 1320\u20131330. 10.1145\/3368089.3417051"},{"key":"e_1_3_2_1_24_1","volume-title":"Proceedings of the 19th ACM SIGPLAN Symposium on Principles and Practice of Parallel Programming","author":"Mehta Sanyam","year":"2014","unstructured":"Sanyam Mehta, Pei-Hung Lin, and Pen-Chung Yew. 2014. Revisiting loop fusion in the polyhedral framework. In Proceedings of the 19th ACM SIGPLAN Symposium on Principles and Practice of Parallel Programming (Orlando, Florida, USA) (PPoPP '14). Association for Computing Machinery, New York, NY, USA, 233\u2013246. 10.1145\/2555243.2555250"},{"key":"e_1_3_2_1_25_1","unstructured":"Microsoft. 2023. Language Integrated Query (LINQ). https:\/\/summer-heart-0930.chufeiyun1688.workers.dev:443\/https\/learn.microsoft.com\/en-us\/dotnet\/csharp\/linq\/."},{"key":"e_1_3_2_1_26_1","volume-title":"Online normalizer calculation for softmax. CoRR abs\/1805.02867","author":"Milakov Maxim","year":"2018","unstructured":"Maxim Milakov and Natalia Gimelshein. 2018. Online normalizer calculation for softmax. CoRR abs\/1805.02867 (2018). arXiv:1805.02867"},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.14778\/3503585.3503601"},{"key":"e_1_3_2_1_28_1","volume-title":"Hanne Riis Nielson, and Chris Hankin","author":"Nielson Flemming","year":"2010","unstructured":"Flemming Nielson, Hanne Riis Nielson, and Chris Hankin. 2010. Principles of Program Analysis. Springer Publishing Company, Incorporated."},{"key":"e_1_3_2_1_29_1","unstructured":"NVIDIA. 2024. Hopper Tuning Guide. https:\/\/summer-heart-0930.chufeiyun1688.workers.dev:443\/https\/docs.nvidia.com\/cuda\/pdf\/Hopper_Tuning_Guide.pdf."},{"key":"e_1_3_2_1_30_1","volume-title":"Proceedings of the 2008 ACM SIGMOD International Conference on Management of Data","author":"Olston Christopher","year":"2008","unstructured":"Christopher Olston, Benjamin Reed, Utkarsh Srivastava, Ravi Kumar, and Andrew Tomkins. 2008. Pig latin: a not-so-foreign language for data processing. In Proceedings of the 2008 ACM SIGMOD International Conference on Management of Data (Vancouver, Canada) (SIGMOD '08). Association for Computing Machinery, New York, NY, USA, 1099\u20131110. 10.1145\/1376616.1376726"},{"key":"e_1_3_2_1_31_1","volume-title":"Types and Programming Languages","author":"Pierce Benjamin C.","unstructured":"Benjamin C. Pierce. 2002. Types and Programming Languages (1st ed.). The MIT Press.","edition":"1"},{"key":"e_1_3_2_1_32_1","volume-title":"Catamorphism Generation and Fusion Using Coq. In 2014 16th International Symposium on Symbolic and Numeric Algorithms for Scientific Computing. 180\u2013185","author":"Robillard Simon","year":"2014","unstructured":"Simon Robillard. 2014. Catamorphism Generation and Fusion Using Coq. In 2014 16th International Symposium on Symbolic and Numeric Algorithms for Scientific Computing. 180\u2013185. 10.1109\/SYNASC.2014.32"},{"key":"e_1_3_2_1_33_1","volume-title":"Proceedings of the 32nd ACM SIGPLAN Conference on Programming Language Design and Implementation","author":"Srivastava Saurabh","year":"1993","unstructured":"Saurabh Srivastava, Sumit Gulwani, Swarat Chaudhuri, and Jeffrey S. Foster. 2011. Path-based inductive synthesis for program inversion. In Proceedings of the 32nd ACM SIGPLAN Conference on Programming Language Design and Implementation (San Jose, California, USA) (PLDI '11). Association for Computing Machinery, New York, NY, USA, 492\u2013503. 10.1145\/1993498.1993557"},{"key":"e_1_3_2_1_34_1","volume-title":"Proceedings of the 14th ACM SIGPLAN International Symposium on Haskell (Virtual, Republic of Korea) (Haskell 2021","author":"Teegen Finn","year":"2021","unstructured":"Finn Teegen, Kai-Oliver Prott, and Niels Bunkenburg. 2021. Haskell-1: automatic function inversion in Haskell. In Proceedings of the 14th ACM SIGPLAN International Symposium on Haskell (Virtual, Republic of Korea) (Haskell 2021). Association for Computing Machinery, New York, NY, USA, 41\u201355. 10.1145\/3471874.3472982"},{"key":"e_1_3_2_1_35_1","volume-title":"Proceedings of the 31st International Conference on Neural Information Processing Systems","author":"Vaswani Ashish","year":"2017","unstructured":"Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszkoreit, Llion Jones, Aidan N. Gomez, \u0141ukasz Kaiser, and Illia Polosukhin. 2017. Attention is all you need. In Proceedings of the 31st International Conference on Neural Information Processing Systems (Long Beach, California, USA) (NIPS'17). Curran Associates Inc., Red Hook, NY, USA, 6000\u20136010."},{"key":"e_1_3_2_1_36_1","volume-title":"Proceedings of the 2014 ACM International Conference on Object Oriented Programming Systems Languages & Applications","author":"Xiao Tian","year":"2014","unstructured":"Tian Xiao, Zhenyu Guo, Hucheng Zhou, Jiaxing Zhang, Xu Zhao, Chencheng Ye, Xi Wang, Wei Lin, Wenguang Chen, and Lidong Zhou. 2014. Cybertron: pushing the limit on I\/O reduction in data-parallel programs. In Proceedings of the 2014 ACM International Conference on Object Oriented Programming Systems Languages & Applications (Portland, Oregon, USA) (OOPSLA '14). Association for Computing Machinery, New York, NY, USA, 895\u2013908. 10.1145\/2660193.2660204"},{"key":"e_1_3_2_1_37_1","volume-title":"8th USENIX Symposium on Operating Systems Design and Implementation (OSDI 08)","author":"Ylleyu Yuan","year":"2008","unstructured":"Yuan Ylleyu, Michael Isard, Dennis Fetterly, Mihai Budiu, \u00dalfar Erlingsson, Pradeep Kumar Gunda, and Jon Currey. 2008. DryadLINQ: A System for General-Purpose Distributed Data-Parallel Computing Using a High-Level Language. In 8th USENIX Symposium on Operating Systems Design and Implementation (OSDI 08). USENIX Association, San Diego, CA."},{"key":"e_1_3_2_1_38_1","volume-title":"Proceedings of the ACM SIGOPS 22nd Symposium on Operating Systems Principles","author":"Yu Yuan","year":"2009","unstructured":"Yuan Yu, Pradeep Kumar Gunda, and Michael Isard. 2009. Distributed aggregation for data-parallel computing: interfaces and implementations. In Proceedings of the ACM SIGOPS 22nd Symposium on Operating Systems Principles (Big Sky, Montana, USA) (SOSP '09). Association for Computing Machinery, New York, NY, USA, 247\u2013260. 10.1145\/1629575.1629600"},{"key":"e_1_3_2_1_39_1","doi-asserted-by":"publisher","DOI":"10.1145\/2934664"}],"event":{"name":"FSE Companion '25: 33rd ACM International Conference on the Foundations of Software Engineering","sponsor":["SIGSOFT ACM Special Interest Group on Software Engineering"],"location":"Clarion Hotel Trondheim Trondheim Norway","acronym":"FSE Companion '25"},"container-title":["Proceedings of the 33rd ACM International Conference on the Foundations of Software Engineering"],"original-title":[],"link":[{"URL":"https:\/\/summer-heart-0930.chufeiyun1688.workers.dev:443\/https\/dl.acm.org\/doi\/pdf\/10.1145\/3696630.3728496","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,7,28]],"date-time":"2025-07-28T19:12:55Z","timestamp":1753729975000},"score":1,"resource":{"primary":{"URL":"https:\/\/summer-heart-0930.chufeiyun1688.workers.dev:443\/https\/dl.acm.org\/doi\/10.1145\/3696630.3728496"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,6,23]]},"references-count":39,"alternative-id":["10.1145\/3696630.3728496","10.1145\/3696630"],"URL":"https:\/\/summer-heart-0930.chufeiyun1688.workers.dev:443\/https\/doi.org\/10.1145\/3696630.3728496","relation":{},"subject":[],"published":{"date-parts":[[2025,6,23]]},"assertion":[{"value":"2025-07-28","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}