Stop the war!
Остановите войну!
for scientists:
default search action
BibTeX records: Torsten Hoefler
@article{DBLP:journals/csur/BestaGPFPBAH24,
  author     = {Maciej Besta and Robert Gerstenberger and Emanuel Peter and Marc Fischer and Michal Podstawski and Claude Barthels and Gustavo Alonso and Torsten Hoefler},
  title      = {Demystifying Graph Databases: Analysis and Taxonomy of Data Organization, System Designs, and Graph Queries},
  journal    = {{ACM} Comput. Surv.},
  volume     = {56},
  number     = {2},
  pages      = {31:1--31:40},
  year       = {2024},
  url        = {https://doi.org/10.1145/3604932},
  doi        = {10.1145/3604932},
  timestamp  = {Fri, 27 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/csur/BestaGPFPBAH24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/fgcs/SensiMGVH24,
  author     = {De Sensi, Daniele and Edgar Costa Molero and Di Girolamo, Salvatore and Laurent Vanbever and Torsten Hoefler},
  title      = {Canary: Congestion-aware in-network allreduce using dynamic trees},
  journal    = {Future Gener. Comput. Syst.},
  volume     = {152},
  pages      = {70--82},
  year       = {2024},
  url        = {https://doi.org/10.1016/j.future.2023.10.010},
  doi        = {10.1016/J.FUTURE.2023.10.010},
  timestamp  = {Fri, 26 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/fgcs/SensiMGVH24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ncs/BauerHSH24,
  author     = {Peter Bauer and Torsten Hoefler and Bjorn Stevens and Wilco Hazeleger},
  title      = {Digital twins of Earth and the computing challenge of human interaction},
  journal    = {Nat. Comput. Sci.},
  volume     = {4},
  number     = {3},
  pages      = {154--157},
  year       = {2024},
  url        = {https://doi.org/10.1038/s43588-024-00599-3},
  doi        = {10.1038/S43588-024-00599-3},
  timestamp  = {Mon, 15 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/ncs/BauerHSH24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/pami/BestaH24,
  author     = {Maciej Besta and Torsten Hoefler},
  title      = {Parallel and Distributed Graph Neural Networks: An In-Depth Concurrency Analysis},
  journal    = {{IEEE} Trans. Pattern Anal. Mach. Intell.},
  volume     = {46},
  number     = {5},
  pages      = {2584--2606},
  year       = {2024},
  url        = {https://doi.org/10.1109/TPAMI.2023.3303431},
  doi        = {10.1109/TPAMI.2023.3303431},
  timestamp  = {Mon, 15 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/pami/BestaH24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/tc/BenzRSROKHB24,
  author     = {Thomas Benz and Michael Rogenmoser and Paul Scheffler and Samuel Riedel and Alessandro Ottaviano and Andreas Kurth and Torsten Hoefler and Luca Benini},
  title      = {A High-Performance, Energy-Efficient Modular {DMA} Engine Architecture},
  journal    = {{IEEE} Trans. Computers},
  volume     = {73},
  number     = {1},
  pages      = {263--277},
  year       = {2024},
  url        = {https://doi.org/10.1109/TC.2023.3329930},
  doi        = {10.1109/TC.2023.3329930},
  timestamp  = {Sat, 13 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/tc/BenzRSROKHB24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/BestaBKGPGGLNNH24,
  author     = {Maciej Besta and Nils Blach and Ales Kubicek and Robert Gerstenberger and Michal Podstawski and Lukas Gianinazzi and Joanna Gajda and Tomasz Lehmann and Hubert Niewiadomski and Piotr Nyczyk and Torsten Hoefler},
  editor     = {Michael J. Wooldridge and Jennifer G. Dy and Sriraam Natarajan},
  title      = {Graph of Thoughts: Solving Elaborate Problems with Large Language Models},
  booktitle  = {Thirty-Eighth {AAAI} Conference on Artificial Intelligence, {AAAI} 2024, Thirty-Sixth Conference on Innovative Applications of Artificial Intelligence, {IAAI} 2024, Fourteenth Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2024, February 20-27, 2024, Vancouver, Canada},
  pages      = {17682--17690},
  publisher  = {{AAAI} Press},
  year       = {2024},
  url        = {https://doi.org/10.1609/aaai.v38i16.29720},
  doi        = {10.1609/AAAI.V38I16.29720},
  timestamp  = {Tue, 02 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/BestaBKGPGGLNNH24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nsdi/BlachBSDH0IKLKF24,
  author     = {Nils Blach and Maciej Besta and De Sensi, Daniele and Jens Domke and Hussein Harake and Shigang Li and Patrick Iff and Marek Konieczny and Kartik Lakhotia and Ales Kubicek and Marcel Ferrari and Fabrizio Petrini and Torsten Hoefler},
  editor     = {Laurent Vanbever and Irene Zhang},
  title      = {A High-Performance Design, Implementation, Deployment, and Evaluation of The Slim Fly Network},
  booktitle  = {21st {USENIX} Symposium on Networked Systems Design and Implementation, {NSDI} 2024, Santa Clara, CA, April 15-17, 2024},
  publisher  = {{USENIX} Association},
  year       = {2024},
  url        = {https://www.usenix.org/conference/nsdi24/presentation/blach},
  timestamp  = {Fri, 19 Apr 2024 11:29:16 +0200},
  biburl     = {https://dblp.org/rec/conf/nsdi/BlachBSDH0IKLKF24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nsdi/SensiBSH24,
  author     = {De Sensi, Daniele and Tommaso Bonato and David Saam and Torsten Hoefler},
  editor     = {Laurent Vanbever and Irene Zhang},
  title      = {Swing: Short-cutting Rings for Higher Bandwidth Allreduce},
  booktitle  = {21st {USENIX} Symposium on Networked Systems Design and Implementation, {NSDI} 2024, Santa Clara, CA, April 15-17, 2024},
  publisher  = {{USENIX} Association},
  year       = {2024},
  url        = {https://www.usenix.org/conference/nsdi24/presentation/de-sensi},
  timestamp  = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/nsdi/SensiBSH24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ppopp/GianinazziZHLAS24,
  author     = {Lukas Gianinazzi and Alexandros Nikolaos Ziogas and Langwen Huang and Piotr Luczynski and Saleh Ashkboos and Florian Scheidl and Armon Carigiet and Chio Ge and Nabil Abubaker and Maciej Besta and Tal Ben{-}Nun and Torsten Hoefler},
  editor     = {Michel Steuwer and I{-}Ting Angelina Lee and Milind Chabbi},
  title      = {Arrow Matrix Decomposition: {A} Novel Approach for Communication-Efficient Sparse Matrix Multiplication},
  booktitle  = {Proceedings of the 29th {ACM} {SIGPLAN} Annual Symposium on Principles and Practice of Parallel Programming, PPoPP 2024, Edinburgh, United Kingdom, March 2-6, 2024},
  pages      = {404--416},
  publisher  = {{ACM}},
  year       = {2024},
  url        = {https://doi.org/10.1145/3627535.3638496},
  doi        = {10.1145/3627535.3638496},
  timestamp  = {Mon, 01 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/ppopp/GianinazziZHLAS24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2401-04552,
  author     = {Torsten Hoefler and Marcin Copik and Pete Beckman and Andrew Jones and Ian T. Foster and Manish Parashar and Daniel A. Reed and Matthias Troyer and Thomas C. Schulthess and Dan Ernst and Jack J. Dongarra},
  title      = {XaaS: Acceleration as a Service to Enable Productive High-Performance Cloud Computing},
  journal    = {CoRR},
  volume     = {abs/2401.04552},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2401.04552},
  doi        = {10.48550/ARXIV.2401.04552},
  eprinttype = {arXiv},
  eprint     = {2401.04552},
  timestamp  = {Wed, 24 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2401-04552.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2401-05932,
  author     = {Langwen Huang and Lukas Gianinazzi and Yuejiang Yu and Peter D. D{\"{u}}ben and Torsten Hoefler},
  title      = {DiffDA: a diffusion model for weather-scale data assimilation},
  journal    = {CoRR},
  volume     = {abs/2401.05932},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2401.05932},
  doi        = {10.48550/ARXIV.2401.05932},
  eprinttype = {arXiv},
  eprint     = {2401.05932},
  timestamp  = {Thu, 25 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2401-05932.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2401-09356,
  author     = {De Sensi, Daniele and Tommaso Bonato and David Saam and Torsten Hoefler},
  title      = {Swing: Short-cutting Rings for Higher Bandwidth Allreduce},
  journal    = {CoRR},
  volume     = {abs/2401.09356},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2401.09356},
  doi        = {10.48550/ARXIV.2401.09356},
  eprinttype = {arXiv},
  eprint     = {2401.09356},
  timestamp  = {Thu, 01 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2401-09356.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2401-09359,
  author     = {Samuel Riedel and Marc Gantenbein and Alessandro Ottaviano and Torsten Hoefler and Luca Benini},
  title      = {LRSCwait: Enabling Scalable and Efficient Synchronization in Manycore Systems through Polling-Free and Retry-Free Operation},
  journal    = {CoRR},
  volume     = {abs/2401.09359},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2401.09359},
  doi        = {10.48550/ARXIV.2401.09359},
  eprinttype = {arXiv},
  eprint     = {2401.09359},
  timestamp  = {Thu, 01 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2401-09359.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2401-10834,
  author     = {Lukas M{\"{o}}ller and Marcin Copik and Alexandru Calotoiu and Torsten Hoefler},
  title      = {Cppless: Productive and Performant Serverless Programming in {C++}},
  journal    = {CoRR},
  volume     = {abs/2401.10834},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2401.10834},
  doi        = {10.48550/ARXIV.2401.10834},
  eprinttype = {arXiv},
  eprint     = {2401.10834},
  timestamp  = {Fri, 02 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2401-10834.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2401-10852,
  author     = {Marcin Copik and Marcin Chrapek and Larissa Schmid and Alexandru Calotoiu and Torsten Hoefler},
  title      = {Software Resource Disaggregation for {HPC} with Serverless Computing},
  journal    = {CoRR},
  volume     = {abs/2401.10852},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2401.10852},
  doi        = {10.48550/ARXIV.2401.10852},
  eprinttype = {arXiv},
  eprint     = {2401.10852},
  timestamp  = {Fri, 02 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2401-10852.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2401-14295,
  author     = {Maciej Besta and Florim Memedi and Zhenyu Zhang and Robert Gerstenberger and Nils Blach and Piotr Nyczyk and Marcin Copik and Grzegorz Kwasniewski and J{\"{u}}rgen M{\"{u}}ller and Lukas Gianinazzi and Ales Kubicek and Hubert Niewiadomski and Onur Mutlu and Torsten Hoefler},
  title      = {Topologies of Reasoning: Demystifying Chains, Trees, and Graphs of Thoughts},
  journal    = {CoRR},
  volume     = {abs/2401.14295},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2401.14295},
  doi        = {10.48550/ARXIV.2401.14295},
  eprinttype = {arXiv},
  eprint     = {2401.14295},
  timestamp  = {Tue, 06 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2401-14295.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2401-15024,
  author     = {Saleh Ashkboos and Maximilian L. Croci and Marcelo Gennari Do Nascimento and Torsten Hoefler and James Hensman},
  title      = {SliceGPT: Compress Large Language Models by Deleting Rows and Columns},
  journal    = {CoRR},
  volume     = {abs/2401.15024},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2401.15024},
  doi        = {10.48550/ARXIV.2401.15024},
  eprinttype = {arXiv},
  eprint     = {2401.15024},
  timestamp  = {Tue, 06 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2401-15024.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2402-19364,
  author     = {Lukas Gianinazzi and Alexandros Nikolaos Ziogas and Langwen Huang and Piotr Luczynski and Saleh Ashkboos and Florian Scheidl and Armon Carigiet and Chio Ge and Nabil Abubaker and Maciej Besta and Tal Ben{-}Nun and Torsten Hoefler},
  title      = {Arrow Matrix Decomposition: {A} Novel Approach for Communication-Efficient Sparse Matrix Multiplication},
  journal    = {CoRR},
  volume     = {abs/2402.19364},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2402.19364},
  doi        = {10.48550/ARXIV.2402.19364},
  eprinttype = {arXiv},
  eprint     = {2402.19364},
  timestamp  = {Tue, 26 Mar 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2402-19364.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/cacm/HoeflerHT23,
  author     = {Torsten Hoefler and Thomas H{\"{a}}ner and Matthias Troyer},
  title      = {Disentangling Hype from Practicality: On Realistically Achieving Quantum Advantage},
  journal    = {Commun. {ACM}},
  volume     = {66},
  number     = {5},
  pages      = {82--87},
  year       = {2023},
  url        = {https://doi.org/10.1145/3571725},
  doi        = {10.1145/3571725},
  timestamp  = {Thu, 18 May 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/cacm/HoeflerHT23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/computer/HoeflerRUAGTKAS23,
  author     = {Torsten Hoefler and Duncan Roweth and Keith D. Underwood and Robert Alverson and Mark Griswold and Vahid Tabatabaee and Mohan Kalkunte and Surendra Anubolu and Siyuan Shen and Moray McLaren and Abdul Kabbani and Steve Scott},
  title      = {Data Center Ethernet and Remote Direct Memory Access: Issues at Hyperscale},
  journal    = {Computer},
  volume     = {56},
  number     = {7},
  pages      = {67--77},
  year       = {2023},
  url        = {https://doi.org/10.1109/MC.2023.3261184},
  doi        = {10.1109/MC.2023.3261184},
  timestamp  = {Fri, 07 Jul 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/computer/HoeflerRUAGTKAS23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/cse/HoeflerSPBSSTKMFKGAFZKKSFL23,
  author     = {Torsten Hoefler and Bjorn Stevens and Andreas F. Prein and Johanna Baehr and Thomas C. Schulthess and Thomas F. Stocker and John A. Taylor and Daniel Klocke and Pekka Manninen and Piers M. Forster and Tobias K{\"{o}}lling and Nicolas Gruber and Hartwig Anzt and Claudia Frauen and Florian Ziemen and Milan Kl{\"{o}}wer and Karthik Kashinath and Christoph M. Sch{\"{a}}r and Oliver Fuhrer and Bryan N. Lawrence},
  title      = {Earth Virtualization Engines: {A} Technical Perspective},
  journal    = {Comput. Sci. Eng.},
  volume     = {25},
  number     = {3},
  pages      = {50--59},
  year       = {2023},
  url        = {https://doi.org/10.1109/MCSE.2023.3311148},
  doi        = {10.1109/MCSE.2023.3311148},
  timestamp  = {Thu, 09 Nov 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/cse/HoeflerSPBSSTKMFKGAFZKKSFL23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ijhpca/MatsuokaDWDH23,
  author     = {Satoshi Matsuoka and Jens Domke and Mohamed Wahib and Aleksandr Drozd and Torsten Hoefler},
  title      = {Myths and legends in high-performance computing},
  journal    = {Int. J. High Perform. Comput. Appl.},
  volume     = {37},
  number     = {3-4},
  pages      = {245--259},
  year       = {2023},
  url        = {https://doi.org/10.1177/10943420231166608},
  doi        = {10.1177/10943420231166608},
  timestamp  = {Sat, 05 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/ijhpca/MatsuokaDWDH23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/tpds/BestaFKKH23,
  author     = {Maciej Besta and Marc Fischer and Vasiliki Kalavri and Michael Kapralov and Torsten Hoefler},
  title      = {Practice of Streaming Processing of Dynamic Graphs: Concepts, Models, and Systems},
  journal    = {{IEEE} Trans. Parallel Distributed Syst.},
  volume     = {34},
  number     = {6},
  pages      = {1860--1876},
  year       = {2023},
  url        = {https://doi.org/10.1109/TPDS.2021.3131677},
  doi        = {10.1109/TPDS.2021.3131677},
  timestamp  = {Fri, 02 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/tpds/BestaFKKH23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/tpds/SchefflerZSHB23,
  author     = {Paul Scheffler and Florian Zaruba and Fabian Schuiki and Torsten Hoefler and Luca Benini},
  title      = {Sparse Stream Semantic Registers: {A} Lightweight {ISA} Extension Accelerating General Sparse Linear Algebra},
  journal    = {{IEEE} Trans. Parallel Distributed Syst.},
  volume     = {34},
  number     = {12},
  pages      = {3147--3161},
  year       = {2023},
  url        = {https://doi.org/10.1109/TPDS.2023.3322029},
  doi        = {10.1109/TPDS.2023.3322029},
  timestamp  = {Sun, 10 Dec 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/tpds/SchefflerZSHB23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/bigdataconf/QiuCWCH23,
  author     = {Wei Qiu and Marcin Copik and Yun Wang and Alexandru Calotoiu and Torsten Hoefler},
  editor     = {Jingrui He and Themis Palpanas and Xiaohua Hu and Alfredo Cuzzocrea and Dejing Dou and Dominik Slezak and Wei Wang and Aleksandra Gruca and Jerry Chun{-}Wei Lin and Rakesh Agrawal},
  title      = {User-guided Page Merging for Memory Deduplication in Serverless Systems},
  booktitle  = {{IEEE} International Conference on Big Data, BigData 2023, Sorrento, Italy, December 15-18, 2023},
  pages      = {159--169},
  publisher  = {{IEEE}},
  year       = {2023},
  url        = {https://doi.org/10.1109/BigData59044.2023.10386487},
  doi        = {10.1109/BIGDATA59044.2023.10386487},
  timestamp  = {Fri, 02 Feb 2024 12:00:39 +0100},
  biburl     = {https://dblp.org/rec/conf/bigdataconf/QiuCWCH23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/cgo/Ben-NunACH23,
  author     = {Tal Ben{-}Nun and Berke Ates and Alexandru Calotoiu and Torsten Hoefler},
  editor     = {Christophe Dubach and Derek Bruening and Ben Hardekopf},
  title      = {Bridging Control-Centric and Data-Centric Optimization},
  booktitle  = {Proceedings of the 21st {ACM/IEEE} International Symposium on Code Generation and Optimization, {CGO} 2023, Montr{\'{e}}al, QC, Canada, 25 February 2023- 1 March 2023},
  pages      = {173--185},
  publisher  = {{ACM}},
  year       = {2023},
  url        = {https://doi.org/10.1145/3579990.3580018},
  doi        = {10.1145/3579990.3580018},
  timestamp  = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/cgo/Ben-NunACH23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ciac/BenNunGHO23,
  author     = {Tal Ben{-}Nun and Lukas Gianinazzi and Torsten Hoefler and Yishai Oltchik},
  editor     = {Marios Mavronicolas},
  title      = {Maximum Flows in Parametric Graph Templates},
  booktitle  = {Algorithms and Complexity - 13th International Conference, {CIAC} 2023, Larnaca, Cyprus, June 13-16, 2023, Proceedings},
  series     = {Lecture Notes in Computer Science},
  volume     = {13898},
  pages      = {97--111},
  publisher  = {Springer},
  year       = {2023},
  url        = {https://doi.org/10.1007/978-3-031-30448-4\_8},
  doi        = {10.1007/978-3-031-30448-4\_8},
  timestamp  = {Wed, 17 May 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/ciac/BenNunGHO23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/dac/IffBCFBH23,
  author     = {Patrick Iff and Maciej Besta and Matheus A. Cavalcante and Tim Fischer and Luca Benini and Torsten Hoefler},
  title      = {Sparse Hamming Graph: {A} Customizable Network-on-Chip Topology},
  booktitle  = {60th {ACM/IEEE} Design Automation Conference, {DAC} 2023, San Francisco, CA, USA, July 9-13, 2023},
  pages      = {1--6},
  publisher  = {{IEEE}},
  year       = {2023},
  url        = {https://doi.org/10.1109/DAC56929.2023.10247754},
  doi        = {10.1109/DAC56929.2023.10247754},
  timestamp  = {Sun, 24 Sep 2023 13:31:06 +0200},
  biburl     = {https://dblp.org/rec/conf/dac/IffBCFBH23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/dac/IffBCFBH23a,
  author     = {Patrick Iff and Maciej Besta and Matheus A. Cavalcante and Tim Fischer and Luca Benini and Torsten Hoefler},
  title      = {HexaMesh: Scaling to Hundreds of Chiplets with an Optimized Chiplet Arrangement},
  booktitle  = {60th {ACM/IEEE} Design Automation Conference, {DAC} 2023, San Francisco, CA, USA, July 9-13, 2023},
  pages      = {1--6},
  publisher  = {{IEEE}},
  year       = {2023},
  url        = {https://doi.org/10.1109/DAC56929.2023.10248006},
  doi        = {10.1109/DAC56929.2023.10248006},
  timestamp  = {Sun, 24 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/dac/IffBCFBH23a.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/hpdc/MatteisGLH23,
  author     = {De Matteis, Tiziano and Lukas Gianinazzi and Johannes de Fine Licht and Torsten Hoefler},
  editor     = {Ali Raza Butt and Ningfang Mi and Kyle Chard},
  title      = {Streaming Task Graph Scheduling for Dataflow Architectures},
  booktitle  = {Proceedings of the 32nd International Symposium on High-Performance Parallel and Distributed Computing, {HPDC} 2023, Orlando, FL, USA, June 16-23, 2023},
  pages      = {225--237},
  publisher  = {{ACM}},
  year       = {2023},
  url        = {https://doi.org/10.1145/3588195.3592999},
  doi        = {10.1145/3588195.3592999},
  timestamp  = {Thu, 31 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/hpdc/MatteisGLH23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iccv/LiGHMEV23,
  author     = {Yunqiang Li and Jan C. van Gemert and Torsten Hoefler and Bert Moons and Evangelos Eleftheriou and Bram{-}Ernst Verhoef},
  title      = {Differentiable Transportation Pruning},
  booktitle  = {{IEEE/CVF} International Conference on Computer Vision, {ICCV} 2023, Paris, France, October 1-6, 2023},
  pages      = {16911--16921},
  publisher  = {{IEEE}},
  year       = {2023},
  url        = {https://doi.org/10.1109/ICCV51070.2023.01555},
  doi        = {10.1109/ICCV51070.2023.01555},
  timestamp  = {Mon, 22 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/iccv/LiGHMEV23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/FrantarAHA23,
  author     = {Elias Frantar and Saleh Ashkboos and Torsten Hoefler and Dan Alistarh},
  title      = {{OPTQ:} Accurate Quantization for Generative Pre-trained Transformers},
  booktitle  = {The Eleventh International Conference on Learning Representations, {ICLR} 2023, Kigali, Rwanda, May 1-5, 2023},
  publisher  = {OpenReview.net},
  year       = {2023},
  url        = {https://openreview.net/pdf?id=tcbBPnfwxS},
  timestamp  = {Fri, 30 Jun 2023 14:38:38 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/FrantarAHA23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/HuangH23,
  author     = {Langwen Huang and Torsten Hoefler},
  title      = {Compressing multidimensional weather and climate data into neural networks},
  booktitle  = {The Eleventh International Conference on Learning Representations, {ICLR} 2023, Kigali, Rwanda, May 1-5, 2023},
  publisher  = {OpenReview.net},
  year       = {2023},
  url        = {https://openreview.net/pdf?id=Y5SEe3dfniJ},
  timestamp  = {Fri, 30 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/HuangH23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ics/TrumperBSCH23,
  author     = {Lukas Tr{\"{u}}mper and Tal Ben{-}Nun and Philipp Schaad and Alexandru Calotoiu and Torsten Hoefler},
  editor     = {Kyle A. Gallivan and Efstratios Gallopoulos and Dimitrios S. Nikolopoulos and Ram{\'{o}}n Beivide},
  title      = {Performance Embeddings: {A} Similarity-Based Transfer Tuning Approach to Performance Optimization},
  booktitle  = {Proceedings of the 37th International Conference on Supercomputing, {ICS} 2023, Orlando, FL, USA, June 21-23, 2023},
  pages      = {50--62},
  publisher  = {{ACM}},
  year       = {2023},
  url        = {https://doi.org/10.1145/3577193.3593714},
  doi        = {10.1145/3577193.3593714},
  timestamp  = {Fri, 07 Jul 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/ics/TrumperBSCH23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ics/CopikBCH23,
  author     = {Marcin Copik and Roman B{\"{o}}hringer and Alexandru Calotoiu and Torsten Hoefler},
  editor     = {Kyle A. Gallivan and Efstratios Gallopoulos and Dimitrios S. Nikolopoulos and Ram{\'{o}}n Beivide},
  title      = {{FMI:} Fast and Cheap Message Passing for Serverless Functions},
  booktitle  = {Proceedings of the 37th International Conference on Supercomputing, {ICS} 2023, Orlando, FL, USA, June 21-23, 2023},
  pages      = {373--385},
  publisher  = {{ACM}},
  year       = {2023},
  url        = {https://doi.org/10.1145/3577193.3593718},
  doi        = {10.1145/3577193.3593718},
  timestamp  = {Fri, 07 Jul 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/ics/CopikBCH23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ipps/CopikTCH23,
  author     = {Marcin Copik and Konstantin Taranov and Alexandru Calotoiu and Torsten Hoefler},
  title      = {rFaaS: Enabling High Performance Serverless with {RDMA} and Leases},
  booktitle  = {{IEEE} International Parallel and Distributed Processing Symposium, {IPDPS} 2023, St. Petersburg, FL, USA, May 15-19, 2023},
  pages      = {897--907},
  publisher  = {{IEEE}},
  year       = {2023},
  url        = {https://doi.org/10.1109/IPDPS54959.2023.00094},
  doi        = {10.1109/IPDPS54959.2023.00094},
  timestamp  = {Tue, 25 Jul 2023 16:27:14 +0200},
  biburl     = {https://dblp.org/rec/conf/ipps/CopikTCH23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/qce/NguyenSSSWRHL23,
  author     = {Tommy Nguyen and Yue Shi and Samuel Alexander Stein and Tim Stavenger and Marvin Warner and Martin Roetteler and Torsten Hoefler and Ang Li},
  editor     = {La Cour, Brian and Lia Yeh and Marek Osinski},
  title      = {A Reference Implementation for a Quantum Message Passing Interface},
  booktitle  = {{IEEE} International Conference on Quantum Computing and Engineering, {QCE} 2023, Bellevue, WA, USA, September 17-22, 2023},
  pages      = {292--293},
  publisher  = {{IEEE}},
  year       = {2023},
  url        = {https://doi.org/10.1109/QCE57702.2023.10248},
  doi        = {10.1109/QCE57702.2023.10248},
  timestamp  = {Fri, 15 Dec 2023 20:24:40 +0100},
  biburl     = {https://dblp.org/rec/conf/qce/NguyenSSSWRHL23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/sc/BestaGFPBEMCMNM23,
  author     = {Maciej Besta and Robert Gerstenberger and Marc Fischer and Michal Podstawski and Nils Blach and Berke Egeli and George Mitenkov and Wojciech Chlapek and Marek T. Michalewicz and Hubert Niewiadomski and J{\"{u}}rgen M{\"{u}}ller and Torsten Hoefler},
  editor     = {Dorian Arnold and Rosa M. Badia and Kathryn M. Mohror},
  title      = {The Graph Database Interface: Scaling Online Transactional and Analytical Graph Workloads to Hundreds of Thousands of Cores},
  booktitle  = {Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis, {SC} 2023, Denver, CO, USA, November 12-17, 2023},
  pages      = {22:1--22:18},
  publisher  = {{ACM}},
  year       = {2023},
  url        = {https://doi.org/10.1145/3581784.3607068},
  doi        = {10.1145/3581784.3607068},
  timestamp  = {Thu, 09 Nov 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/sc/BestaGFPBEMCMNM23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/sc/ChrapekKH23,
  author     = {Marcin Chrapek and Mikhail Khalilov and Torsten Hoefler},
  editor     = {Dorian Arnold and Rosa M. Badia and Kathryn M. Mohror},
  title      = {{HEAR:} Homomorphically Encrypted Allreduce},
  booktitle  = {Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis, {SC} 2023, Denver, CO, USA, November 12-17, 2023},
  pages      = {36:1--36:17},
  publisher  = {{ACM}},
  year       = {2023},
  url        = {https://doi.org/10.1145/3581784.3607099},
  doi        = {10.1145/3581784.3607099},
  timestamp  = {Tue, 28 Nov 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/sc/ChrapekKH23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/sc/BestaRGLZCGSSCI23,
  author     = {Maciej Besta and Pawel Renc and Robert Gerstenberger and Sylos Labini, Paolo and Alexandros Nikolaos Ziogas and Tiancheng Chen and Lukas Gianinazzi and Florian Scheidl and Kalman Szenes and Armon Carigiet and Patrick Iff and Grzegorz Kwasniewski and Raghavendra Kanakagiri and Chio Ge and Sammy Jaeger and Jaroslaw Was and Flavio Vella and Torsten Hoefler},
  editor     = {Dorian Arnold and Rosa M. Badia and Kathryn M. Mohror},
  title      = {High-Performance and Programmable Attentional Graph Neural Networks with Global Tensor Formulations},
  booktitle  = {Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis, {SC} 2023, Denver, CO, USA, November 12-17, 2023},
  pages      = {66:1--66:16},
  publisher  = {{ACM}},
  year       = {2023},
  url        = {https://doi.org/10.1145/3581784.3607067},
  doi        = {10.1145/3581784.3607067},
  timestamp  = {Sun, 12 Nov 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/sc/BestaRGLZCGSSCI23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/sc/CastroIABFH23,
  author     = {Roberto L. Castro and Andrei Ivanov and Diego Andrade and Tal Ben{-}Nun and Basilio B. Fraguela and Torsten Hoefler},
  editor     = {Dorian Arnold and Rosa M. Badia and Kathryn M. Mohror},
  title      = {{VENOM:} {A} Vectorized {N:} {M} Format for Unleashing the Power of Sparse Tensor Cores},
  booktitle  = {Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis, {SC} 2023, Denver, CO, USA, November 12-17, 2023},
  pages      = {72:1--72:14},
  publisher  = {{ACM}},
  year       = {2023},
  url        = {https://doi.org/10.1145/3581784.3607087},
  doi        = {10.1145/3581784.3607087},
  timestamp  = {Tue, 28 Nov 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/sc/CastroIABFH23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/sc/JiangLZLHSRZRHA23,
  author     = {Wenqi Jiang and Shigang Li and Yu Zhu and Johannes de Fine Licht and Zhenhao He and Runbin Shi and C{\'{e}}dric Renggli and Shuai Zhang and Theodoros Rekatsinas and Torsten Hoefler and Gustavo Alonso},
  editor     = {Dorian Arnold and Rosa M. Badia and Kathryn M. Mohror},
  title      = {Co-design Hardware and Algorithm for Vector Search},
  booktitle  = {Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis, {SC} 2023, Denver, CO, USA, November 12-17, 2023},
  pages      = {87:1--87:15},
  publisher  = {{ACM}},
  year       = {2023},
  url        = {https://doi.org/10.1145/3581784.3607045},
  doi        = {10.1145/3581784.3607045},
  timestamp  = {Fri, 24 Nov 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/sc/JiangLZLHSRZRHA23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/sc/SchaadSBCZH23,
  author     = {Philipp Schaad and Timo Schneider and Tal Ben{-}Nun and Alexandru Calotoiu and Alexandros Nikolaos Ziogas and Torsten Hoefler},
  editor     = {Dorian Arnold and Rosa M. Badia and Kathryn M. Mohror},
  title      = {FuzzyFlow: Leveraging Dataflow To Find and Squash Program Optimization Bugs},
  booktitle  = {Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis, {SC} 2023, Denver, CO, USA, November 12-17, 2023},
  pages      = {88:1--88:15},
  publisher  = {{ACM}},
  year       = {2023},
  url        = {https://doi.org/10.1145/3581784.3613214},
  doi        = {10.1145/3581784.3613214},
  timestamp  = {Thu, 09 Nov 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/sc/SchaadSBCZH23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/sc/ShiNSSWRHL23,
  author     = {Yue Shi and Tommy Nguyen and Samuel Alexander Stein and Tim Stavenger and Marvin Warner and Martin Roetteler and Torsten Hoefler and Ang Li},
  title      = {A Reference Implementation for a Quantum Message Passing Interface},
  booktitle  = {Proceedings of the {SC} '23 Workshops of The International Conference on High Performance Computing, Network, Storage, and Analysis, {SC-W} 2023, Denver, CO, USA, November 12-17, 2023},
  pages      = {1420--1425},
  publisher  = {{ACM}},
  year       = {2023},
  url        = {https://doi.org/10.1145/3624062.3624212},
  doi        = {10.1145/3624062.3624212},
  timestamp  = {Thu, 30 Nov 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/sc/ShiNSSWRHL23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/sigmetrics/SensiMTGRH23,
  author    = {Daniele De Sensi and Tiziano De Matteis and Konstantin Taranov and Salvatore Di Girolamo and Tobias Rahn and Torsten Hoefler},
  editor    = {Evgenia Smirni and Konstantin Avrachenkov and Phillipa Gill and Bhuvan Urgaonkar},
  title     = {Noise in the Clouds: Influence of Network Performance Variability on Application Scalability},
  booktitle = {Abstract Proceedings of the 2023 {ACM} {SIGMETRICS} International Conference on Measurement and Modeling of Computer Systems, {SIGMETRICS} 2023, Orlando, FL, USA, June 19-23, 2023},
  pages     = {17--18},
  publisher = {{ACM}},
  year      = {2023},
  url       = {https://doi.org/10.1145/3578338.3593555},
  doi       = {10.1145/3578338.3593555},
  timestamp = {Fri, 07 Jul 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/sigmetrics/SensiMTGRH23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Title: braces keep the topology name PolarFly intact under sentence-casing styles.
@inproceedings{DBLP:conf/spaa/LakhotiaIMBHP23,
  author    = {Kartik Lakhotia and Kelly Isham and Laura Monroe and Maciej Besta and Torsten Hoefler and Fabrizio Petrini},
  editor    = {Kunal Agrawal and Julian Shun},
  title     = {In-network Allreduce with Multiple Spanning Trees on {PolarFly}},
  booktitle = {Proceedings of the 35th {ACM} Symposium on Parallelism in Algorithms and Architectures, {SPAA} 2023, Orlando, FL, USA, June 17-19, 2023},
  pages     = {165--176},
  publisher = {{ACM}},
  year      = {2023},
  url       = {https://doi.org/10.1145/3558481.3591073},
  doi       = {10.1145/3558481.3591073},
  timestamp = {Thu, 15 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/spaa/LakhotiaIMBHP23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/usenix/IvanovRDCHP23,
  author    = {Andrei Ivanov and Benjamin Rothenberger and Arnaud Dethise and Marco Canini and Torsten Hoefler and Adrian Perrig},
  editor    = {Julia Lawall and Dan Williams},
  title     = {{SAGE:} Software-based Attestation for {GPU} Execution},
  booktitle = {2023 {USENIX} Annual Technical Conference, {USENIX} {ATC} 2023, Boston, MA, USA, July 10-12, 2023},
  pages     = {485--499},
  publisher = {{USENIX} Association},
  year      = {2023},
  url       = {https://www.usenix.org/conference/atc23/presentation/ivanov},
  timestamp = {Sat, 15 Jul 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/usenix/IvanovRDCHP23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Title: braces keep the acronym I/O uppercase under sentence-casing styles.
@article{DBLP:journals/corr/abs-2301-01048,
  author     = {Niels Gleinig and Tal Ben{-}Nun and Torsten Hoefler},
  title      = {A Theory of {I/O}-Efficient Sparse Neural Network Inference},
  journal    = {CoRR},
  volume     = {abs/2301.01048},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2301.01048},
  doi        = {10.48550/ARXIV.2301.01048},
  eprinttype = {arXiv},
  eprint     = {2301.01048},
  timestamp  = {Tue, 10 Jan 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2301-01048.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2301-02432,
  author     = {Satoshi Matsuoka and Jens Domke and Mohamed Wahib and Aleksandr Drozd and Torsten Hoefler},
  title      = {Myths and Legends in High-Performance Computing},
  journal    = {CoRR},
  volume     = {abs/2301.02432},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2301.02432},
  doi        = {10.48550/ARXIV.2301.02432},
  eprinttype = {arXiv},
  eprint     = {2301.02432},
  timestamp  = {Tue, 10 Jan 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2301-02432.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: braces keep the system name AutoDDL intact under sentence-casing styles.
@article{DBLP:journals/corr/abs-2301-06813,
  author     = {Jinfan Chen and Shigang Li and Ran Guo and Jinhui Yuan and Torsten Hoefler},
  title      = {{AutoDDL}: Automatic Distributed Deep Learning with Asymptotically Optimal Communication},
  journal    = {CoRR},
  volume     = {abs/2301.06813},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2301.06813},
  doi        = {10.48550/ARXIV.2301.06813},
  eprinttype = {arXiv},
  eprint     = {2301.06813},
  timestamp  = {Thu, 19 Jan 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2301-06813.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: braces keep the acronym NISQ uppercase under sentence-casing styles.
@article{DBLP:journals/corr/abs-2302-01066,
  author     = {Niels Gleinig and Tobias Rohner and Torsten Hoefler},
  title      = {Approximate Reversible Circuits for {NISQ}-Era Quantum Computers},
  journal    = {CoRR},
  volume     = {abs/2302.01066},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2302.01066},
  doi        = {10.48550/ARXIV.2302.01066},
  eprinttype = {arXiv},
  eprint     = {2302.01066},
  timestamp  = {Thu, 09 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2302-01066.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: braces keep the proper noun Ethernet capitalized under sentence-casing styles.
@article{DBLP:journals/corr/abs-2302-03337,
  author     = {Torsten Hoefler and Duncan Roweth and Keith D. Underwood and Bob Alverson and Mark Griswold and Vahid Tabatabaee and Mohan Kalkunte and Surendra Anubolu and Siyuan Shen and Abdul Kabbani and Moray McLaren and Steve Scott},
  title      = {Datacenter {Ethernet} and {RDMA:} Issues at Hyperscale},
  journal    = {CoRR},
  volume     = {abs/2302.03337},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2302.03337},
  doi        = {10.48550/ARXIV.2302.03337},
  eprinttype = {arXiv},
  eprint     = {2302.03337},
  timestamp  = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2302-03337.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: braces keep the topology name PolarStar intact under sentence-casing styles.
@article{DBLP:journals/corr/abs-2302-07217,
  author     = {Kartik Lakhotia and Laura Monroe and Kelly Isham and Maciej Besta and Nils Blach and Torsten Hoefler and Fabrizio Petrini},
  title      = {{PolarStar}: Expanding the Scalability Horizon of Diameter-3 Networks},
  journal    = {CoRR},
  volume     = {abs/2302.07217},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2302.07217},
  doi        = {10.48550/ARXIV.2302.07217},
  eprinttype = {arXiv},
  eprint     = {2302.07217},
  timestamp  = {Mon, 20 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2302-07217.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2303-08142,
  author     = {Lukas Tr{\"{u}}mper and Tal Ben{-}Nun and Philipp Schaad and Alexandru Calotoiu and Torsten Hoefler},
  title      = {Performance Embeddings: {A} Similarity-based Approach to Automatic Performance Optimization},
  journal    = {CoRR},
  volume     = {abs/2303.08142},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2303.08142},
  doi        = {10.48550/ARXIV.2303.08142},
  eprinttype = {arXiv},
  eprint     = {2303.08142},
  timestamp  = {Mon, 20 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2303-08142.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: braces keep the names STen and PyTorch intact under sentence-casing styles.
@article{DBLP:journals/corr/abs-2304-07613,
  author     = {Andrei Ivanov and Nikoli Dryden and Tal Ben{-}Nun and Saleh Ashkboos and Torsten Hoefler},
  title      = {{STen}: Productive and Efficient Sparsity in {PyTorch}},
  journal    = {CoRR},
  volume     = {abs/2304.07613},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2304.07613},
  doi        = {10.48550/ARXIV.2304.07613},
  eprinttype = {arXiv},
  eprint     = {2304.07613},
  timestamp  = {Fri, 21 Apr 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2304-07613.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: braces keep the framework name PyTorch intact under sentence-casing styles.
@article{DBLP:journals/corr/abs-2305-04684,
  author     = {Kazuki Osawa and Satoki Ishikawa and Rio Yokota and Shigang Li and Torsten Hoefler},
  title      = {{ASDL:} {A} Unified Interface for Gradient Preconditioning in {PyTorch}},
  journal    = {CoRR},
  volume     = {abs/2305.04684},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2305.04684},
  doi        = {10.48550/ARXIV.2305.04684},
  eprinttype = {arXiv},
  eprint     = {2305.04684},
  timestamp  = {Fri, 12 May 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-04684.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2305-05240,
  author     = {Thomas Benz and Michael Rogenmoser and Paul Scheffler and Samuel Riedel and Alessandro Ottaviano and Andreas Kurth and Torsten Hoefler and Luca Benini},
  title      = {A High-performance, Energy-efficient Modular {DMA} Engine Architecture},
  journal    = {CoRR},
  volume     = {abs/2305.05240},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2305.05240},
  doi        = {10.48550/ARXIV.2305.05240},
  eprinttype = {arXiv},
  eprint     = {2305.05240},
  timestamp  = {Fri, 12 May 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-05240.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2305-05559,
  author     = {Paul Scheffler and Florian Zaruba and Fabian Schuiki and Torsten Hoefler and Luca Benini},
  title      = {Sparse Stream Semantic Registers: {A} Lightweight {ISA} Extension Accelerating General Sparse Linear Algebra},
  journal    = {CoRR},
  volume     = {abs/2305.05559},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2305.05559},
  doi        = {10.48550/ARXIV.2305.05559},
  eprinttype = {arXiv},
  eprint     = {2305.05559},
  timestamp  = {Mon, 15 May 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-05559.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2305-08763,
  author     = {Marcin Copik and Roman B{\"{o}}hringer and Alexandru Calotoiu and Torsten Hoefler},
  title      = {{FMI:} Fast and Cheap Message Passing for Serverless Functions},
  journal    = {CoRR},
  volume     = {abs/2305.08763},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2305.08763},
  doi        = {10.48550/ARXIV.2305.08763},
  eprinttype = {arXiv},
  eprint     = {2305.08763},
  timestamp  = {Wed, 17 May 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-08763.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2305-11162,
  author     = {Maciej Besta and Robert Gerstenberger and Marc Fischer and Michal Podstawski and J{\"{u}}rgen M{\"{u}}ller and Nils Blach and Berke Egeli and George Mitenkov and Wojciech Chlapek and Marek T. Michalewicz and Torsten Hoefler},
  title      = {High-Performance Graph Databases That Are Portable, Programmable, and Scale to Hundreds of Thousands of Cores},
  journal    = {CoRR},
  volume     = {abs/2305.11162},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2305.11162},
  doi        = {10.48550/ARXIV.2305.11162},
  eprinttype = {arXiv},
  eprint     = {2305.11162},
  timestamp  = {Sun, 30 Jul 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-11162.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2306-00366,
  author     = {Tal Ben{-}Nun and Berke Ates and Alexandru Calotoiu and Torsten Hoefler},
  title      = {Bridging Control-Centric and Data-Centric Optimization},
  journal    = {CoRR},
  volume     = {abs/2306.00366},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2306.00366},
  doi        = {10.48550/ARXIV.2306.00366},
  eprinttype = {arXiv},
  eprint     = {2306.00366},
  timestamp  = {Mon, 12 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2306-00366.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2306-02730,
  author     = {Tiziano De Matteis and Lukas Gianinazzi and Johannes de Fine Licht and Torsten Hoefler},
  title      = {Streaming Task Graph Scheduling for Dataflow Architectures},
  journal    = {CoRR},
  volume     = {abs/2306.02730},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2306.02730},
  doi        = {10.48550/ARXIV.2306.02730},
  eprinttype = {arXiv},
  eprint     = {2306.02730},
  timestamp  = {Tue, 13 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2306-02730.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: braces keep the mixed-case name SpQR intact under sentence-casing styles.
@article{DBLP:journals/corr/abs-2306-03078,
  author     = {Tim Dettmers and Ruslan Svirschevski and Vage Egiazarian and Denis Kuznedelev and Elias Frantar and Saleh Ashkboos and Alexander Borzunov and Torsten Hoefler and Dan Alistarh},
  title      = {{SpQR}: {A} Sparse-Quantized Representation for Near-Lossless {LLM} Weight Compression},
  journal    = {CoRR},
  volume     = {abs/2306.03078},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2306.03078},
  doi        = {10.48550/ARXIV.2306.03078},
  eprinttype = {arXiv},
  eprint     = {2306.03078},
  timestamp  = {Tue, 13 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2306-03078.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Same title and author list as the proceedings entry DBLP:conf/sc/JiangLZLHSRZRHA23.
@article{DBLP:journals/corr/abs-2306-11182,
  author     = {Wenqi Jiang and Shigang Li and Yu Zhu and Johannes de Fine Licht and Zhenhao He and Runbin Shi and C{\'{e}}dric Renggli and Shuai Zhang and Theodoros Rekatsinas and Torsten Hoefler and Gustavo Alonso},
  title      = {Co-design Hardware and Algorithm for Vector Search},
  journal    = {CoRR},
  volume     = {abs/2306.11182},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2306.11182},
  doi        = {10.48550/ARXIV.2306.11182},
  eprinttype = {arXiv},
  eprint     = {2306.11182},
  timestamp  = {Thu, 19 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2306-11182.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: braces keep the CamelCase name FuzzyFlow intact under sentence-casing styles.
@article{DBLP:journals/corr/abs-2306-16178,
  author     = {Philipp Schaad and Timo Schneider and Tal Ben{-}Nun and Alexandru Calotoiu and Alexandros Nikolaos Ziogas and Torsten Hoefler},
  title      = {{FuzzyFlow}: Leveraging Dataflow To Find and Squash Program Optimization Bugs},
  journal    = {CoRR},
  volume     = {abs/2306.16178},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2306.16178},
  doi        = {10.48550/ARXIV.2306.16178},
  eprinttype = {arXiv},
  eprint     = {2306.16178},
  timestamp  = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2306-16178.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2307-00523,
  author     = {Torsten Hoefler and Thomas H{\"{a}}ner and Matthias Troyer},
  title      = {Disentangling Hype from Practicality: On Realistically Achieving Quantum Advantage},
  journal    = {CoRR},
  volume     = {abs/2307.00523},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2307.00523},
  doi        = {10.48550/ARXIV.2307.00523},
  eprinttype = {arXiv},
  eprint     = {2307.00523},
  timestamp  = {Mon, 10 Jul 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2307-00523.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2307-08420,
  author     = {Tal Ben{-}Nun and Lukas Gianinazzi and Torsten Hoefler and Yishai Oltchik},
  title      = {Maximum Flows in Parametric Graph Templates},
  journal    = {CoRR},
  volume     = {abs/2307.08420},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2307.08420},
  doi        = {10.48550/ARXIV.2307.08420},
  eprinttype = {arXiv},
  eprint     = {2307.08420},
  timestamp  = {Tue, 25 Jul 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2307-08420.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2307-08483,
  author     = {Yunqiang Li and Jan C. van Gemert and Torsten Hoefler and Bert Moons and Evangelos Eleftheriou and Bram{-}Ernst Verhoef},
  title      = {Differentiable Transportation Pruning},
  journal    = {CoRR},
  volume     = {abs/2307.08483},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2307.08483},
  doi        = {10.48550/ARXIV.2307.08483},
  eprinttype = {arXiv},
  eprint     = {2307.08483},
  timestamp  = {Tue, 25 Jul 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2307-08483.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2308-09687,
  author     = {Maciej Besta and Nils Blach and Ales Kubicek and Robert Gerstenberger and Lukas Gianinazzi and Joanna Gajda and Tomasz Lehmann and Michal Podstawski and Hubert Niewiadomski and Piotr Nyczyk and Torsten Hoefler},
  title      = {Graph of Thoughts: Solving Elaborate Problems with Large Language Models},
  journal    = {CoRR},
  volume     = {abs/2308.09687},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2308.09687},
  doi        = {10.48550/ARXIV.2308.09687},
  eprinttype = {arXiv},
  eprint     = {2308.09687},
  timestamp  = {Fri, 25 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2308-09687.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2308-12093,
  author     = {Julia Bazinska and Andrei Ivanov and Tal Ben{-}Nun and Nikoli Dryden and Maciej Besta and Siyuan Shen and Torsten Hoefler},
  title      = {Cached Operator Reordering: {A} Unified View for Fast {GNN} Training},
  journal    = {CoRR},
  volume     = {abs/2308.12093},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2308.12093},
  doi        = {10.48550/ARXIV.2308.12093},
  eprinttype = {arXiv},
  eprint     = {2308.12093},
  timestamp  = {Wed, 30 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2308-12093.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: braces keep the mixed-case term SmartNICs intact under sentence-casing styles.
@article{DBLP:journals/corr/abs-2309-03628,
  author     = {Mikhail Khalilov and Marcin Chrapek and Siyuan Shen and Alessandro Vezzu and Thomas Benz and Salvatore Di Girolamo and Timo Schneider and Daniele De Sensi and Luca Benini and Torsten Hoefler},
  title      = {{OSMOSIS:} Enabling Multi-Tenancy in Datacenter {SmartNICs}},
  journal    = {CoRR},
  volume     = {abs/2309.03628},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2309.03628},
  doi        = {10.48550/ARXIV.2309.03628},
  eprinttype = {arXiv},
  eprint     = {2309.03628},
  timestamp  = {Tue, 12 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2309-03628.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2309-09002,
  author     = {Torsten Hoefler and Bjorn Stevens and Andreas F. Prein and Johanna Baehr and Thomas C. Schulthess and Thomas F. Stocker and John A. Taylor and Daniel Klocke and Pekka Manninen and Piers M. Forster and Tobias K{\"{o}}lling and Nicolas Gruber and Hartwig Anzt and Claudia Frauen and Florian Ziemen and Milan Kl{\"{o}}wer and Karthik Kashinath and Christoph M. Sch{\"{a}}r and Oliver Fuhrer and Bryan N. Lawrence},
  title      = {Earth Virtualization Engines - {A} Technical Perspective},
  journal    = {CoRR},
  volume     = {abs/2309.09002},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2309.09002},
  doi        = {10.48550/ARXIV.2309.09002},
  eprinttype = {arXiv},
  eprint     = {2309.09002},
  timestamp  = {Wed, 08 Nov 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2309-09002.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Same author list as the journal entry DBLP:journals/fgcs/SensiMGVH24; the titles differ only in capitalization.
@article{DBLP:journals/corr/abs-2309-16214,
  author     = {Daniele De Sensi and Edgar Costa Molero and Salvatore Di Girolamo and Laurent Vanbever and Torsten Hoefler},
  title      = {Canary: Congestion-Aware In-Network Allreduce Using Dynamic Trees},
  journal    = {CoRR},
  volume     = {abs/2309.16214},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2309.16214},
  doi        = {10.48550/ARXIV.2309.16214},
  eprinttype = {arXiv},
  eprint     = {2309.16214},
  timestamp  = {Tue, 17 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2309-16214.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: the sparsity-format name N:M is one token; the previous "{N:} {M}" rendered it as "N: M".
@article{DBLP:journals/corr/abs-2310-02065,
  author     = {Roberto L. Castro and Andrei Ivanov and Diego Andrade and Tal Ben{-}Nun and Basilio B. Fraguela and Torsten Hoefler},
  title      = {{VENOM:} {A} Vectorized {N:M} Format for Unleashing the Power of Sparse Tensor Cores},
  journal    = {CoRR},
  volume     = {abs/2310.02065},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.02065},
  doi        = {10.48550/ARXIV.2310.02065},
  eprinttype = {arXiv},
  eprint     = {2310.02065},
  timestamp  = {Thu, 19 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-02065.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: braces keep the topology name Slim Fly capitalized under sentence-casing styles.
@article{DBLP:journals/corr/abs-2310-03742,
  author     = {Nils Blach and Maciej Besta and Daniele De Sensi and Jens Domke and Hussein Harake and Shigang Li and Patrick Iff and Marek Konieczny and Kartik Lakhotia and Ales Kubicek and Marcel Ferrari and Fabrizio Petrini and Torsten Hoefler},
  title      = {A High-Performance Design, Implementation, Deployment, and Evaluation of The {Slim Fly} Network},
  journal    = {CoRR},
  volume     = {abs/2310.03742},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.03742},
  doi        = {10.48550/ARXIV.2310.03742},
  eprinttype = {arXiv},
  eprint     = {2310.03742},
  timestamp  = {Thu, 19 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-03742.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2310-09259,
  author     = {Saleh Ashkboos and Ilia Markov and Elias Frantar and Tingxuan Zhong and Xincheng Wang and Jie Ren and Torsten Hoefler and Dan Alistarh},
  title      = {Towards End-to-end 4-Bit Inference on Generative Large Language Models},
  journal    = {CoRR},
  volume     = {abs/2310.09259},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.09259},
  doi        = {10.48550/ARXIV.2310.09259},
  eprinttype = {arXiv},
  eprint     = {2310.09259},
  timestamp  = {Wed, 25 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-09259.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2310-09949,
  author     = {Wenqi Jiang and Marco Zeller and Roger Waleffe and Torsten Hoefler and Gustavo Alonso},
  title      = {Chameleon: a Heterogeneous and Disaggregated Accelerator System for Retrieval-Augmented Language Models},
  journal    = {CoRR},
  volume     = {abs/2310.09949},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.09949},
  doi        = {10.48550/ARXIV.2310.09949},
  eprinttype = {arXiv},
  eprint     = {2310.09949},
  timestamp  = {Wed, 25 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-09949.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: braces keep the CamelCase name RapidChiplet intact under sentence-casing styles.
@article{DBLP:journals/corr/abs-2311-06081,
  author     = {Patrick Iff and Benigna Bruggmann and Maciej Besta and Luca Benini and Torsten Hoefler},
  title      = {{RapidChiplet}: {A} Toolchain for Rapid Design Space Exploration of Chiplet Architectures},
  journal    = {CoRR},
  volume     = {abs/2311.06081},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2311.06081},
  doi        = {10.48550/ARXIV.2311.06081},
  eprinttype = {arXiv},
  eprint     = {2311.06081},
  timestamp  = {Wed, 15 Nov 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2311-06081.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2311-13588,
  author     = {Wei Qiu and Marcin Copik and Yun Wang and Alexandru Calotoiu and Torsten Hoefler},
  title      = {User-guided Page Merging for Memory Deduplication in Serverless Systems},
  journal    = {CoRR},
  volume     = {abs/2311.13588},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2311.13588},
  doi        = {10.48550/ARXIV.2311.13588},
  eprinttype = {arXiv},
  eprint     = {2311.13588},
  timestamp  = {Thu, 30 Nov 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2311-13588.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2311-18526,
  author     = {Maciej Besta and Afonso Claudino Catarino and Lukas Gianinazzi and Nils Blach and Piotr Nyczyk and Hubert Niewiadomski and Torsten Hoefler},
  title      = {{HOT:} Higher-Order Dynamic Graph Representation Learning with Efficient Transformers},
  journal    = {CoRR},
  volume     = {abs/2311.18526},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2311.18526},
  doi        = {10.48550/ARXIV.2311.18526},
  eprinttype = {arXiv},
  eprint     = {2311.18526},
  timestamp  = {Tue, 05 Dec 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2311-18526.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: TeX-style quotes replace the straight double quotes (which typeset as two closing quotes); braces keep the benchmark name capitalized.
@article{DBLP:journals/corr/abs-2312-13547,
  author     = {Eldar Kurtic and Torsten Hoefler and Dan Alistarh},
  title      = {How to Prune Your Language Model: Recovering Accuracy on the {``Sparsity May Cry''} Benchmark},
  journal    = {CoRR},
  volume     = {abs/2312.13547},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2312.13547},
  doi        = {10.48550/ARXIV.2312.13547},
  eprinttype = {arXiv},
  eprint     = {2312.13547},
  timestamp  = {Wed, 17 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2312-13547.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/computer/HoeflerHR22,
  author    = {Torsten Hoefler and Ariel Hendel and Duncan Roweth},
  title     = {The Convergence of Hyperscale Data Center and High-Performance Computing Networks},
  journal   = {Computer},
  volume    = {55},
  number    = {7},
  pages     = {29--37},
  year      = {2022},
  url       = {https://doi.org/10.1109/MC.2022.3158437},
  doi       = {10.1109/MC.2022.3158437},
  timestamp = {Wed, 06 Jul 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/computer/HoeflerHR22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/computer/Hoefler22,
  author    = {Torsten Hoefler},
  title     = {Benchmarking Data Science: 12 Ways to Lie With Statistics and Performance on Parallel Computers},
  journal   = {Computer},
  volume    = {55},
  number    = {8},
  pages     = {49--56},
  year      = {2022},
  url       = {https://doi.org/10.1109/MC.2022.3152681},
  doi       = {10.1109/MC.2022.3152681},
  timestamp = {Tue, 09 Aug 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/computer/Hoefler22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/tpds/CopikGHBB22,
  author    = {Marcin Copik and Tobias Grosser and Torsten Hoefler and Paolo Bientinesi and Benjamin Berkels},
  title     = {Work-Stealing Prefix Scan: Addressing Load Imbalance in Large-Scale Image Registration},
  journal   = {{IEEE} Trans. Parallel Distributed Syst.},
  volume    = {33},
  number    = {3},
  pages     = {523--535},
  year      = {2022},
  url       = {https://doi.org/10.1109/TPDS.2021.3095230},
  doi       = {10.1109/TPDS.2021.3095230},
  timestamp = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/tpds/CopikGHBB22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Title: braces keep the mixed-case names NeVerMore and NVMe-oF intact under sentence-casing styles.
@inproceedings{DBLP:conf/ccs/TaranovRSPH22,
  author    = {Konstantin Taranov and Benjamin Rothenberger and Daniele De Sensi and Adrian Perrig and Torsten Hoefler},
  editor    = {Heng Yin and Angelos Stavrou and Cas Cremers and Elaine Shi},
  title     = {{NeVerMore}: Exploiting {RDMA} Mistakes in {NVMe-oF} Storage Applications},
  booktitle = {Proceedings of the 2022 {ACM} {SIGSAC} Conference on Computer and Communications Security, {CCS} 2022, Los Angeles, CA, USA, November 7-11, 2022},
  pages     = {2765--2778},
  publisher = {{ACM}},
  year      = {2022},
  url       = {https://doi.org/10.1145/3548606.3560568},
  doi       = {10.1145/3548606.3560568},
  timestamp = {Sat, 17 Dec 2022 01:15:29 +0100},
  biburl    = {https://dblp.org/rec/conf/ccs/TaranovRSPH22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/date/CossettiniTVMHB22,
  author    = {Andrea Cossettini and Konstantin Taranov and Christian Vogt and Michele Magno and Torsten Hoefler and Luca Benini},
  editor    = {Cristiana Bolchini and Ingrid Verbauwhede and Ioana Vatajelu},
  title     = {A {RDMA} Interface for Ultra-Fast Ultrasound Data-Streaming over an Optical Link},
  booktitle = {2022 Design, Automation {\&} Test in Europe Conference {\&} Exhibition, {DATE} 2022, Antwerp, Belgium, March 14-23, 2022},
  pages     = {80--83},
  publisher = {{IEEE}},
  year      = {2022},
  url       = {https://doi.org/10.23919/DATE54114.2022.9774599},
  doi       = {10.23919/DATE54114.2022.9774599},
  timestamp = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/date/CossettiniTVMHB22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/date/GleinigH22,
  author    = {Niels Gleinig and Torsten Hoefler},
  editor    = {Cristiana Bolchini and Ingrid Verbauwhede and Ioana Vatajelu},
  title     = {Circuits for Measurement Based Quantum State Preparation},
  booktitle = {2022 Design, Automation {\&} Test in Europe Conference {\&} Exhibition, {DATE} 2022, Antwerp, Belgium, March 14-23, 2022},
  pages     = {328--333},
  publisher = {{IEEE}},
  year      = {2022},
  url       = {https://doi.org/10.23919/DATE54114.2022.9774680},
  doi       = {10.23919/DATE54114.2022.9774680},
  timestamp = {Wed, 25 May 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/date/GleinigH22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/dsd/BiagioniCFCLMPP22,
  author    = {Andrea Biagioni and Paolo Cretaro and Ottorino Frezza and Francesca Lo Cicero and Alessandro Lonardo and Michele Martinelli and Pier Stanislao Paolucci and Elena Pastorelli and Francesco Simula and Matteo Turisini and Piero Vicini and Roberto Ammendola and Pascale Bernier{-}Bruna and Claire Chen and Said Derradji and St{\'{e}}phane Guez and Pierre{-}Axel Lagadec and Gregoire Pichon and Etienne Walter and Gaetan De Gassowski and Matthieu Hautreaux and Stephane Mathieu and Gilles Moreau and Marc P{\'{e}}rache and Hugo Taboada and Torsten Hoefler and Timo Schneider and Matteo Barnaba and Giuseppe Piero Brandino and Francesco De Giorgi and Matteo Poggi and Iakovos Mavroidis and Yannis Papaefstathiou and Nikolaos Tampouratzis and Benjamin Kalisch and Ulrich Krackhardt and Mondrian Nuessle and Pantelis Xirouchakis and Vangelis Mageiropoulos and Michalis Gianioudis and Harisis Loukas and Aggelos Ioannou and Nikos Kallimanis and Nikos Chrysos and Manolis Katevenis and Wolfang Frings and Dominik Gottwald and Felime Guimaraes and Max Holicki and Volker Marx and Yannik Muller and Carsten Clauss and Hugo Falter and Xu Huang and Jennifer Lopez Barillao and Thomas Moschny and Simon Pickartz and Francisco J. Alfaro and Jes{\'{u}}s Escudero{-}Sahuquillo and Pedro Javier Garc{\'{\i}}a and Francisco J. Quiles and Jos{\'{e}} L. S{\'{a}}nchez and Adri{\'{a}}n Castell{\'{o}} and Jose Duro and Mar{\'{\i}}a Engracia G{\'{o}}mez and Enrique S. Quintana{-}Ort{\'{\i}} and Julio Sahuquillo and Eugenio Stabile},
  title     = {{RED-SEA:} Network Solution for Exascale Architectures},
  booktitle = {25th Euromicro Conference on Digital System Design, {DSD} 2022, Maspalomas, Spain, August 31 - Sept. 2, 2022},
  pages     = {712--719},
  publisher = {{IEEE}},
  year      = {2022},
  url       = {https://doi.org/10.1109/DSD57027.2022.00100},
  doi       = {10.1109/DSD57027.2022.00100},
  timestamp = {Sun, 12 Nov 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/dsd/BiagioniCFCLMPP22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/exampi/CaoGH22,
  author    = {Shiyi Cao and Salvatore Di Girolamo and Torsten Hoefler},
  title     = {Accelerating Data Serialization/Deserialization Protocols with In-Network Compute},
  booktitle = {{IEEE/ACM} International Workshop on Exascale MPI, ExaMPI@SC 2022, Dallas, TX, USA, November 13-18, 2022},
  pages     = {22--30},
  publisher = {{IEEE}},
  year      = {2022},
  url       = {https://doi.org/10.1109/ExaMPI56604.2022.00008},
  doi       = {10.1109/EXAMPI56604.2022.00008},
  timestamp = {Mon, 13 Feb 2023 21:53:09 +0100},
  biburl    = {https://dblp.org/rec/conf/exampi/CaoGH22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/fccm/LichtPZSH22,
  author    = {Johannes de Fine Licht and Christopher A. Pattison and Alexandros Nikolaos Ziogas and David Simmons{-}Duffin and Torsten Hoefler},
  title     = {Fast Arbitrary Precision Floating Point on {FPGA}},
  booktitle = {30th {IEEE} Annual International Symposium on Field-Programmable Custom Computing Machines, {FCCM} 2022, New York City, NY, USA, May 15-18, 2022},
  pages     = {1--9},
  publisher = {{IEEE}},
  year      = {2022},
  url       = {https://doi.org/10.1109/FCCM53951.2022.9786219},
  doi       = {10.1109/FCCM53951.2022.9786219},
  timestamp = {Mon, 13 Jun 2022 16:53:36 +0200},
  biburl    = {https://dblp.org/rec/conf/fccm/LichtPZSH22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/iccad/JohnsenMBLH22,
  author    = {Carl{-}Johannes Johnsen and Tiziano De Matteis and Tal Ben{-}Nun and Johannes de Fine Licht and Torsten Hoefler},
  editor    = {Tulika Mitra and Evangeline F. Y. Young and Jinjun Xiong},
  title     = {Temporal Vectorization: {A} Compiler Approach to Automatic Multi-Pumping},
  booktitle = {Proceedings of the 41st {IEEE/ACM} International Conference on Computer-Aided Design, {ICCAD} 2022, San Diego, California, USA, 30 October 2022 - 3 November 2022},
  pages     = {85:1--85:9},
  publisher = {{ACM}},
  year      = {2022},
  url       = {https://doi.org/10.1145/3508352.3549374},
  doi       = {10.1145/3508352.3549374},
  timestamp = {Tue, 06 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/iccad/JohnsenMBLH22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% ICLR 2022 conference paper (DBLP record conf/iclr/PlummerDFHS22).
% The record carries an OpenReview URL and no doi field.
@inproceedings{DBLP:conf/iclr/PlummerDFHS22,
  author     = {Bryan A. Plummer and Nikoli Dryden and Julius Frost and Torsten Hoefler and Kate Saenko},
  title      = {Neural Parameter Allocation Search},
  booktitle  = {The Tenth International Conference on Learning Representations, {ICLR} 2022, Virtual Event, April 25-29, 2022},
  publisher  = {OpenReview.net},
  year       = {2022},
  url        = {https://openreview.net/forum?id=srtIXtySfT4},
  timestamp  = {Sat, 20 Aug 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/PlummerDFHS22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICS 2022 conference paper (DBLP record conf/ics/SchmidCCWRSKH22).
@inproceedings{DBLP:conf/ics/SchmidCCWRSKH22,
  author     = {Larissa Schmid and Marcin Copik and Alexandru Calotoiu and Dominik Werle and Andreas Reiter and Michael Selzer and Anne Koziolek and Torsten Hoefler},
  editor     = {Lawrence Rauchwerger and Kirk W. Cameron and Dimitrios S. Nikolopoulos and Dionisios N. Pnevmatikatos},
  title      = {Performance-detective: automatic deduction of cheap and accurate performance models},
  booktitle  = {{ICS} '22: 2022 International Conference on Supercomputing, Virtual Event, June 28 - 30, 2022},
  pages      = {3:1--3:13},
  publisher  = {{ACM}},
  year       = {2022},
  url        = {https://doi.org/10.1145/3524059.3532391},
  doi        = {10.1145/3524059.3532391},
  timestamp  = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/ics/SchmidCCWRSKH22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICS 2022 conference paper (DBLP record conf/ics/CalotoiuBKLSSH22).
@inproceedings{DBLP:conf/ics/CalotoiuBKLSSH22,
  author     = {Alexandru Calotoiu and Tal Ben{-}Nun and Grzegorz Kwasniewski and Johannes de Fine Licht and Timo Schneider and Philipp Schaad and Torsten Hoefler},
  editor     = {Lawrence Rauchwerger and Kirk W. Cameron and Dimitrios S. Nikolopoulos and Dionisios N. Pnevmatikatos},
  title      = {Lifting {C} semantics for dataflow optimization},
  booktitle  = {{ICS} '22: 2022 International Conference on Supercomputing, Virtual Event, June 28 - 30, 2022},
  pages      = {17:1--17:13},
  publisher  = {{ACM}},
  year       = {2022},
  url        = {https://doi.org/10.1145/3524059.3532389},
  doi        = {10.1145/3524059.3532389},
  timestamp  = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/ics/CalotoiuBKLSSH22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICS 2022 conference paper (DBLP record conf/ics/RauschBDI0H22).
@inproceedings{DBLP:conf/ics/RauschBDI0H22,
  author     = {Oliver Rausch and Tal Ben{-}Nun and Nikoli Dryden and Andrei Ivanov and Shigang Li and Torsten Hoefler},
  editor     = {Lawrence Rauchwerger and Kirk W. Cameron and Dimitrios S. Nikolopoulos and Dionisios N. Pnevmatikatos},
  title      = {A data-centric optimization framework for machine learning},
  booktitle  = {{ICS} '22: 2022 International Conference on Supercomputing, Virtual Event, June 28 - 30, 2022},
  pages      = {36:1--36:13},
  publisher  = {{ACM}},
  year       = {2022},
  url        = {https://doi.org/10.1145/3524059.3532364},
  doi        = {10.1145/3524059.3532364},
  timestamp  = {Wed, 22 Jun 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/ics/RauschBDI0H22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICST 2022 conference paper (DBLP record conf/icst/LascuDGH22).
@inproceedings{DBLP:conf/icst/LascuDGH22,
  author     = {Andrei Lascu and Alastair F. Donaldson and Tobias Grosser and Torsten Hoefler},
  title      = {Metamorphic Fuzzing of {C++} Libraries},
  booktitle  = {15th {IEEE} Conference on Software Testing, Verification and Validation, {ICST} 2022, Valencia, Spain, April 4-14, 2022},
  pages      = {35--46},
  publisher  = {{IEEE}},
  year       = {2022},
  url        = {https://doi.org/10.1109/ICST53961.2022.00015},
  doi        = {10.1109/ICST53961.2022.00015},
  timestamp  = {Mon, 13 Jun 2022 16:53:36 +0200},
  biburl     = {https://dblp.org/rec/conf/icst/LascuDGH22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% IPDPS 2022 conference paper (DBLP record conf/ipps/GleinigBH22).
% "I/O" is brace-protected so sentence-casing styles do not render it "I/o".
@inproceedings{DBLP:conf/ipps/GleinigBH22,
  author     = {Niels Gleinig and Maciej Besta and Torsten Hoefler},
  title      = {{I/O}-Optimal Cache-Oblivious Sparse Matrix-Sparse Matrix Multiplication},
  booktitle  = {2022 {IEEE} International Parallel and Distributed Processing Symposium, {IPDPS} 2022, Lyon, France, May 30 - June 3, 2022},
  pages      = {36--46},
  publisher  = {{IEEE}},
  year       = {2022},
  url        = {https://doi.org/10.1109/IPDPS53621.2022.00013},
  doi        = {10.1109/IPDPS53621.2022.00013},
  timestamp  = {Fri, 22 Jul 2022 11:14:30 +0200},
  biburl     = {https://dblp.org/rec/conf/ipps/GleinigBH22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% IPDPS 2022 conference paper (DBLP record conf/ipps/StrauszVGBH22).
% The compound surname "Di Girolamo" is written in "Last, First" form so that
% BibTeX does not parse "Di" as part of the given name.
@inproceedings{DBLP:conf/ipps/StrauszVGBH22,
  author     = {Andr{\'{a}}s Strausz and Flavio Vella and Di Girolamo, Salvatore and Maciej Besta and Torsten Hoefler},
  title      = {Asynchronous Distributed-Memory Triangle Counting and {LCC} with {RMA} Caching},
  booktitle  = {2022 {IEEE} International Parallel and Distributed Processing Symposium, {IPDPS} 2022, Lyon, France, May 30 - June 3, 2022},
  pages      = {291--301},
  publisher  = {{IEEE}},
  year       = {2022},
  url        = {https://doi.org/10.1109/IPDPS53621.2022.00036},
  doi        = {10.1109/IPDPS53621.2022.00036},
  timestamp  = {Wed, 07 Dec 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/ipps/StrauszVGBH22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% KDD 2022 conference paper (DBLP record conf/kdd/BestaGMBKGKAGDH22).
@inproceedings{DBLP:conf/kdd/BestaGMBKGKAGDH22,
  author     = {Maciej Besta and Raphael Grob and Cesare Miglioli and Nicola Bernold and Grzegorz Kwasniewski and Gabriel Gjini and Raghavendra Kanakagiri and Saleh Ashkboos and Lukas Gianinazzi and Nikoli Dryden and Torsten Hoefler},
  editor     = {Aidong Zhang and Huzefa Rangwala},
  title      = {Motif Prediction with Graph Neural Networks},
  booktitle  = {{KDD} '22: The 28th {ACM} {SIGKDD} Conference on Knowledge Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022},
  pages      = {35--45},
  publisher  = {{ACM}},
  year       = {2022},
  url        = {https://doi.org/10.1145/3534678.3539343},
  doi        = {10.1145/3534678.3539343},
  timestamp  = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/kdd/BestaGMBKGKAGDH22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% LoG 2022 conference paper, PMLR volume 198 (DBLP record conf/log/BestaISODPCH22).
% The pages field holds a single number as exported by DBLP.
@inproceedings{DBLP:conf/log/BestaISODPCH22,
  author     = {Maciej Besta and Patrick Iff and Florian Scheidl and Kazuki Osawa and Nikoli Dryden and Michal Podstawski and Tiancheng Chen and Torsten Hoefler},
  editor     = {Bastian Rieck and Razvan Pascanu},
  title      = {Neural Graph Databases},
  booktitle  = {Learning on Graphs Conference, LoG 2022, 9-12 December 2022, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {198},
  pages      = {31},
  publisher  = {{PMLR}},
  year       = {2022},
  url        = {https://proceedings.mlr.press/v198/besta22a.html},
  timestamp  = {Fri, 17 Feb 2023 16:29:10 +0100},
  biburl     = {https://dblp.org/rec/conf/log/BestaISODPCH22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2022 paper (DBLP record conf/nips/AshkboosHDBDGKH22).
% The url keeps the escaped underscores exactly as exported by DBLP.
@inproceedings{DBLP:conf/nips/AshkboosHDBDGKH22,
  author     = {Saleh Ashkboos and Langwen Huang and Nikoli Dryden and Tal Ben{-}Nun and Peter Dueben and Lukas Gianinazzi and Luca Kummer and Torsten Hoefler},
  editor     = {Sanmi Koyejo and S. Mohamed and A. Agarwal and Danielle Belgrave and K. Cho and A. Oh},
  title      = {{ENS-10:} {A} Dataset For Post-Processing Ensemble Weather Forecasts},
  booktitle  = {Advances in Neural Information Processing Systems 35: Annual Conference on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans, LA, USA, November 28 - December 9, 2022},
  year       = {2022},
  url        = {http://papers.nips.cc/paper\_files/paper/2022/hash/89e44582fd28ddfea1ea4dcb0ebbf4b0-Abstract-Datasets\_and\_Benchmarks.html},
  timestamp  = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/AshkboosHDBDGKH22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2022 paper (DBLP record conf/nips/DrydenH22).
% The url keeps the escaped underscores exactly as exported by DBLP.
@inproceedings{DBLP:conf/nips/DrydenH22,
  author     = {Nikoli Dryden and Torsten Hoefler},
  editor     = {Sanmi Koyejo and S. Mohamed and A. Agarwal and Danielle Belgrave and K. Cho and A. Oh},
  title      = {Spatial Mixture-of-Experts},
  booktitle  = {Advances in Neural Information Processing Systems 35: Annual Conference on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans, LA, USA, November 28 - December 9, 2022},
  year       = {2022},
  url        = {http://papers.nips.cc/paper\_files/paper/2022/hash/4c5e2bcbf21bdf40d75fddad0bd43dc9-Abstract-Conference.html},
  timestamp  = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/DrydenH22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% PPoPP 2022 conference paper (DBLP record conf/ppopp/0002H22).
@inproceedings{DBLP:conf/ppopp/0002H22,
  author     = {Shigang Li and Torsten Hoefler},
  editor     = {Jaejin Lee and Kunal Agrawal and Michael F. Spear},
  title      = {Near-optimal sparse allreduce for distributed deep learning},
  booktitle  = {PPoPP '22: 27th {ACM} {SIGPLAN} Symposium on Principles and Practice of Parallel Programming, Seoul, Republic of Korea, April 2 - 6, 2022},
  pages      = {135--149},
  publisher  = {{ACM}},
  year       = {2022},
  url        = {https://doi.org/10.1145/3503221.3508399},
  doi        = {10.1145/3503221.3508399},
  timestamp  = {Sun, 12 Jun 2022 19:46:08 +0200},
  biburl     = {https://dblp.org/rec/conf/ppopp/0002H22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% SC22 conference paper (DBLP record conf/sc/GirolamoSTMBSKH22).
% The compound surnames "Di Girolamo" and "De Sensi" are written in
% "Last, First" form so that BibTeX keeps both words in the surname.
@inproceedings{DBLP:conf/sc/GirolamoSTMBSKH22,
  author     = {Di Girolamo, Salvatore and De Sensi, Daniele and Konstantin Taranov and Milos Malesevic and Maciej Besta and Timo Schneider and Severin Kistler and Torsten Hoefler},
  editor     = {Felix Wolf and Sameer Shende and Candace Culhane and Sadaf R. Alam and Heike Jagode},
  title      = {Building Blocks for Network-Accelerated Distributed File Systems},
  booktitle  = {{SC22:} International Conference for High Performance Computing, Networking, Storage and Analysis, Dallas, TX, USA, November 13-18, 2022},
  pages      = {10:1--10:14},
  publisher  = {{IEEE}},
  year       = {2022},
  url        = {https://doi.org/10.1109/SC41404.2022.00015},
  doi        = {10.1109/SC41404.2022.00015},
  timestamp  = {Wed, 24 May 2023 16:17:06 +0200},
  biburl     = {https://dblp.org/rec/conf/sc/GirolamoSTMBSKH22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% SC22 conference paper (DBLP record conf/sc/HoeflerBSGLHBGCS22).
% "HammingMesh" is brace-protected so sentence-casing styles keep its inner
% capital; the compound surnames "De Sensi" and "Di Girolamo" are written in
% "Last, First" form so that BibTeX keeps both words in the surname.
@inproceedings{DBLP:conf/sc/HoeflerBSGLHBGCS22,
  author     = {Torsten Hoefler and Tommaso Bonato and De Sensi, Daniele and Di Girolamo, Salvatore and Shigang Li and Marco Heddes and Jon Belk and Deepak Goel and Miguel Castro and Steve Scott},
  editor     = {Felix Wolf and Sameer Shende and Candace Culhane and Sadaf R. Alam and Heike Jagode},
  title      = {{HammingMesh}: {A} Network Topology for Large-Scale Deep Learning},
  booktitle  = {{SC22:} International Conference for High Performance Computing, Networking, Storage and Analysis, Dallas, TX, USA, November 13-18, 2022},
  pages      = {11:1--11:18},
  publisher  = {{IEEE}},
  year       = {2022},
  url        = {https://doi.org/10.1109/SC41404.2022.00016},
  doi        = {10.1109/SC41404.2022.00016},
  timestamp  = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/sc/HoeflerBSGLHBGCS22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% SC22 conference paper (DBLP record conf/sc/LakhotiaBMIIHP22).
% "PolarFly" is brace-protected so sentence-casing styles keep its inner capital.
@inproceedings{DBLP:conf/sc/LakhotiaBMIIHP22,
  author     = {Kartik Lakhotia and Maciej Besta and Laura Monroe and Kelly Isham and Patrick Iff and Torsten Hoefler and Fabrizio Petrini},
  editor     = {Felix Wolf and Sameer Shende and Candace Culhane and Sadaf R. Alam and Heike Jagode},
  title      = {{PolarFly}: {A} Cost-Effective and Flexible Low-Diameter Topology},
  booktitle  = {{SC22:} International Conference for High Performance Computing, Networking, Storage and Analysis, Dallas, TX, USA, November 13-18, 2022},
  pages      = {12:1--12:15},
  publisher  = {{IEEE}},
  year       = {2022},
  url        = {https://doi.org/10.1109/SC41404.2022.00017},
  doi        = {10.1109/SC41404.2022.00017},
  timestamp  = {Wed, 24 May 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/sc/LakhotiaBMIIHP22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% SC22 conference paper (DBLP record conf/sc/ZiogasKBSH22).
@inproceedings{DBLP:conf/sc/ZiogasKBSH22,
  author     = {Alexandros Nikolaos Ziogas and Grzegorz Kwasniewski and Tal Ben{-}Nun and Timo Schneider and Torsten Hoefler},
  editor     = {Felix Wolf and Sameer Shende and Candace Culhane and Sadaf R. Alam and Heike Jagode},
  title      = {Deinsum: Practically {I/O} Optimal Multi-Linear Algebra},
  booktitle  = {{SC22:} International Conference for High Performance Computing, Networking, Storage and Analysis, Dallas, TX, USA, November 13-18, 2022},
  pages      = {25:1--25:15},
  publisher  = {{IEEE}},
  year       = {2022},
  url        = {https://doi.org/10.1109/SC41404.2022.00030},
  doi        = {10.1109/SC41404.2022.00030},
  timestamp  = {Wed, 24 May 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/sc/ZiogasKBSH22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% SC22 conference paper (DBLP record conf/sc/LiOH22).
@inproceedings{DBLP:conf/sc/LiOH22,
  author     = {Shigang Li and Kazuki Osawa and Torsten Hoefler},
  editor     = {Felix Wolf and Sameer Shende and Candace Culhane and Sadaf R. Alam and Heike Jagode},
  title      = {Efficient Quantized Sparse Matrix Operations on Tensor Cores},
  booktitle  = {{SC22:} International Conference for High Performance Computing, Networking, Storage and Analysis, Dallas, TX, USA, November 13-18, 2022},
  pages      = {37:1--37:15},
  publisher  = {{IEEE}},
  year       = {2022},
  url        = {https://doi.org/10.1109/SC41404.2022.00042},
  doi        = {10.1109/SC41404.2022.00042},
  timestamp  = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/sc/LiOH22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% SC22 conference paper (DBLP record conf/sc/BestaMLTIKAJPKGVMH22).
% "ProbGraph" is brace-protected so sentence-casing styles keep its inner
% capital; the compound surname "Sylos Labini" is written in "Last, First"
% form so that BibTeX keeps both words in the surname.
@inproceedings{DBLP:conf/sc/BestaMLTIKAJPKGVMH22,
  author     = {Maciej Besta and Cesare Miglioli and Sylos Labini, Paolo and Jakub Tetek and Patrick Iff and Raghavendra Kanakagiri and Saleh Ashkboos and Kacper Janda and Michal Podstawski and Grzegorz Kwasniewski and Niels Gleinig and Flavio Vella and Onur Mutlu and Torsten Hoefler},
  editor     = {Felix Wolf and Sameer Shende and Candace Culhane and Sadaf R. Alam and Heike Jagode},
  title      = {{ProbGraph}: High-Performance and High-Accuracy Graph Mining with Probabilistic Set Representations},
  booktitle  = {{SC22:} International Conference for High Performance Computing, Networking, Storage and Analysis, Dallas, TX, USA, November 13-18, 2022},
  pages      = {43:1--43:17},
  publisher  = {{IEEE}},
  year       = {2022},
  url        = {https://doi.org/10.1109/SC41404.2022.00048},
  doi        = {10.1109/SC41404.2022.00048},
  timestamp  = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/sc/BestaMLTIKAJPKGVMH22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% SC22 conference paper (DBLP record conf/sc/SchaadBH22).
@inproceedings{DBLP:conf/sc/SchaadBH22,
  author     = {Philipp Schaad and Tal Ben{-}Nun and Torsten Hoefler},
  editor     = {Felix Wolf and Sameer Shende and Candace Culhane and Sadaf R. Alam and Heike Jagode},
  title      = {Boosting Performance Optimization with Interactive Data Movement Visualization},
  booktitle  = {{SC22:} International Conference for High Performance Computing, Networking, Storage and Analysis, Dallas, TX, USA, November 13-18, 2022},
  pages      = {64:1--64:16},
  publisher  = {{IEEE}},
  year       = {2022},
  url        = {https://doi.org/10.1109/SC41404.2022.00069},
  doi        = {10.1109/SC41404.2022.00069},
  timestamp  = {Wed, 24 May 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/sc/SchaadBH22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% SC22 conference paper (DBLP record conf/sc/BenNunGDWDDEGMTWFSH22).
% "Python" is brace-protected so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/sc/BenNunGDWDDEGMTWFSH22,
  author     = {Tal Ben{-}Nun and Linus Groner and Florian Deconinck and Tobias Wicky and Eddie Davis and Johann Dahm and Oliver Elbert and Rhea George and Jeremy McGibbon and Lukas Tr{\"{u}}mper and Elynn Wu and Oliver Fuhrer and Thomas C. Schulthess and Torsten Hoefler},
  editor     = {Felix Wolf and Sameer Shende and Candace Culhane and Sadaf R. Alam and Heike Jagode},
  title      = {Productive Performance Engineering for Weather and Climate Modeling with {Python}},
  booktitle  = {{SC22:} International Conference for High Performance Computing, Networking, Storage and Analysis, Dallas, TX, USA, November 13-18, 2022},
  pages      = {73:1--73:14},
  publisher  = {{IEEE}},
  year       = {2022},
  url        = {https://doi.org/10.1109/SC41404.2022.00078},
  doi        = {10.1109/SC41404.2022.00078},
  timestamp  = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/sc/BenNunGDWDDEGMTWFSH22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% SIGMOD 2022 conference paper (DBLP record conf/sigmod/TaranovBMH22).
% "KafkaDirect" and "Apache Kafka" are brace-protected so sentence-casing
% styles keep their capitals; the editor surname "El Abbadi" is written in
% "Last, First" form so that BibTeX keeps both words in the surname.
@inproceedings{DBLP:conf/sigmod/TaranovBMH22,
  author     = {Konstantin Taranov and Steve Byan and Virendra J. Marathe and Torsten Hoefler},
  editor     = {Zachary G. Ives and Angela Bonifati and El Abbadi, Amr},
  title      = {{KafkaDirect}: Zero-copy Data Access for {Apache Kafka} over {RDMA} Networks},
  booktitle  = {{SIGMOD} '22: International Conference on Management of Data, Philadelphia, PA, USA, June 12 - 17, 2022},
  pages      = {2191--2204},
  publisher  = {{ACM}},
  year       = {2022},
  url        = {https://doi.org/10.1145/3514221.3526056},
  doi        = {10.1145/3514221.3526056},
  timestamp  = {Thu, 16 Mar 2023 09:51:25 +0100},
  biburl     = {https://dblp.org/rec/conf/sigmod/TaranovBMH22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% SIROCCO 2022 conference paper, LNCS 13298 (DBLP record conf/sirocco/GleinigH22).
% "DAGs" is brace-protected so sentence-casing styles do not render it "dags".
% The url and doi keep the escaped underscore exactly as exported by DBLP.
@inproceedings{DBLP:conf/sirocco/GleinigH22,
  author     = {Niels Gleinig and Torsten Hoefler},
  editor     = {Merav Parter},
  title      = {The Red-Blue Pebble Game on Trees and {DAGs} with Large Input},
  booktitle  = {Structural Information and Communication Complexity - 29th International Colloquium, {SIROCCO} 2022, Paderborn, Germany, June 27-29, 2022, Proceedings},
  series     = {Lecture Notes in Computer Science},
  volume     = {13298},
  pages      = {135--153},
  publisher  = {Springer},
  year       = {2022},
  url        = {https://doi.org/10.1007/978-3-031-09993-9\_8},
  doi        = {10.1007/978-3-031-09993-9\_8},
  timestamp  = {Tue, 28 Jun 2022 16:23:40 +0200},
  biburl     = {https://dblp.org/rec/conf/sirocco/GleinigH22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2201.07598, listed by DBLP under CoRR.
% A doi field derived from the eprint id (arXiv DOI scheme) is added so the
% record carries the same identifiers as the other CoRR entries in this file.
@article{DBLP:journals/corr/abs-2201-07598,
  author     = {Shigang Li and Torsten Hoefler},
  title      = {Near-Optimal Sparse Allreduce for Distributed Deep Learning},
  journal    = {CoRR},
  volume     = {abs/2201.07598},
  year       = {2022},
  url        = {https://arxiv.org/abs/2201.07598},
  doi        = {10.48550/ARXIV.2201.07598},
  eprinttype = {arXiv},
  eprint     = {2201.07598},
  timestamp  = {Fri, 21 Jan 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2201-07598.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2202.08080, listed by DBLP under CoRR.
% "NeVerMore" and "NVMe-oF" are brace-protected so sentence-casing styles keep
% their capitals; the compound surname "De Sensi" is written in "Last, First"
% form; a doi field derived from the eprint id (arXiv DOI scheme) is added to
% match the other CoRR entries in this file.
@article{DBLP:journals/corr/abs-2202-08080,
  author     = {Konstantin Taranov and Benjamin Rothenberger and De Sensi, Daniele and Adrian Perrig and Torsten Hoefler},
  title      = {{NeVerMore}: Exploiting {RDMA} Mistakes in {NVMe-oF} Storage Applications},
  journal    = {CoRR},
  volume     = {abs/2202.08080},
  year       = {2022},
  url        = {https://arxiv.org/abs/2202.08080},
  doi        = {10.48550/ARXIV.2202.08080},
  eprinttype = {arXiv},
  eprint     = {2202.08080},
  timestamp  = {Tue, 01 Mar 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2202-08080.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2202.13976, listed by DBLP under CoRR.
% The compound surname "Di Girolamo" is written in "Last, First" form so that
% BibTeX keeps both words in the surname; a doi field derived from the eprint
% id (arXiv DOI scheme) is added to match the other CoRR entries in this file.
@article{DBLP:journals/corr/abs-2202-13976,
  author     = {Andr{\'{a}}s Strausz and Flavio Vella and Di Girolamo, Salvatore and Maciej Besta and Torsten Hoefler},
  title      = {Asynchronous Distributed-Memory Triangle Counting and {LCC} with {RMA} Caching},
  journal    = {CoRR},
  volume     = {abs/2202.13976},
  year       = {2022},
  url        = {https://arxiv.org/abs/2202.13976},
  doi        = {10.48550/ARXIV.2202.13976},
  eprinttype = {arXiv},
  eprint     = {2202.13976},
  timestamp  = {Thu, 03 Mar 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2202-13976.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2203.14859, listed by DBLP under CoRR.
% "FaasKeeper" is brace-protected so sentence-casing styles keep its inner capital.
@article{DBLP:journals/corr/abs-2203-14859,
  author     = {Marcin Copik and Alexandru Calotoiu and Konstantin Taranov and Torsten Hoefler},
  title      = {{FaasKeeper}: a Blueprint for Serverless Services},
  journal    = {CoRR},
  volume     = {abs/2203.14859},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2203.14859},
  doi        = {10.48550/ARXIV.2203.14859},
  eprinttype = {arXiv},
  eprint     = {2203.14859},
  timestamp  = {Mon, 04 Apr 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2203-14859.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2204.06256, listed by DBLP under CoRR.
@article{DBLP:journals/corr/abs-2204-06256,
  author     = {Johannes de Fine Licht and Christopher A. Pattison and Alexandros Nikolaos Ziogas and David Simmons{-}Duffin and Torsten Hoefler},
  title      = {Fast Arbitrary Precision Floating Point on {FPGA}},
  journal    = {CoRR},
  volume     = {abs/2204.06256},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2204.06256},
  doi        = {10.48550/ARXIV.2204.06256},
  eprinttype = {arXiv},
  eprint     = {2204.06256},
  timestamp  = {Tue, 19 Apr 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2204-06256.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2205.04148, listed by DBLP under CoRR.
% "Python" is brace-protected so sentence-casing styles do not lowercase it.
@article{DBLP:journals/corr/abs-2205-04148,
  author     = {Tal Ben{-}Nun and Linus Groner and Florian Deconinck and Tobias Wicky and Eddie Davis and Johann Dahm and Oliver Elbert and Rhea George and Jeremy McGibbon and Lukas Tr{\"{u}}mper and Elynn Wu and Oliver Fuhrer and Thomas C. Schulthess and Torsten Hoefler},
  title      = {Productive Performance Engineering for Weather and Climate Modeling with {Python}},
  journal    = {CoRR},
  volume     = {abs/2205.04148},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2205.04148},
  doi        = {10.48550/ARXIV.2205.04148},
  eprinttype = {arXiv},
  eprint     = {2205.04148},
  timestamp  = {Wed, 11 May 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2205-04148.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2205.04934, listed by DBLP under CoRR.
@article{DBLP:journals/corr/abs-2205-04934,
  author     = {Lukas Gianinazzi and Tal Ben{-}Nun and Saleh Ashkboos and Yves Baumann and Piotr Luczynski and Torsten Hoefler},
  title      = {The spatial computer: {A} model for energy-efficient parallel computation},
  journal    = {CoRR},
  volume     = {abs/2205.04934},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2205.04934},
  doi        = {10.48550/ARXIV.2205.04934},
  eprinttype = {arXiv},
  eprint     = {2205.04934},
  timestamp  = {Wed, 11 May 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2205-04934.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2205.09702, listed by DBLP under CoRR.
@article{DBLP:journals/corr/abs-2205-09702,
  author     = {Maciej Besta and Torsten Hoefler},
  title      = {Parallel and Distributed Graph Neural Networks: An In-Depth Concurrency Analysis},
  journal    = {CoRR},
  volume     = {abs/2205.09702},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2205.09702},
  doi        = {10.48550/ARXIV.2205.09702},
  eprinttype = {arXiv},
  eprint     = {2205.09702},
  timestamp  = {Mon, 23 May 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2205-09702.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2206.08301, listed by DBLP under CoRR.
@article{DBLP:journals/corr/abs-2206-08301,
  author     = {Alexandros Nikolaos Ziogas and Grzegorz Kwasniewski and Tal Ben{-}Nun and Timo Schneider and Torsten Hoefler},
  title      = {Deinsum: Practically {I/O} Optimal Multilinear Algebra},
  journal    = {CoRR},
  volume     = {abs/2206.08301},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2206.08301},
  doi        = {10.48550/ARXIV.2206.08301},
  eprinttype = {arXiv},
  eprint     = {2206.08301},
  timestamp  = {Tue, 21 Jun 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2206-08301.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2206.10007, listed by DBLP under CoRR.
% The compound surnames "Di Girolamo" and "De Sensi" are written in
% "Last, First" form so that BibTeX keeps both words in the surname.
@article{DBLP:journals/corr/abs-2206-10007,
  author     = {Di Girolamo, Salvatore and De Sensi, Daniele and Konstantin Taranov and Milos Malesevic and Maciej Besta and Timo Schneider and Severin Kistler and Torsten Hoefler},
  title      = {Building Blocks for Network-Accelerated Distributed File Systems},
  journal    = {CoRR},
  volume     = {abs/2206.10007},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2206.10007},
  doi        = {10.48550/ARXIV.2206.10007},
  eprinttype = {arXiv},
  eprint     = {2206.10007},
  timestamp  = {Mon, 27 Jun 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2206-10007.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2206.14786, listed by DBLP under CoRR.
@article{DBLP:journals/corr/abs-2206-14786,
  author     = {Saleh Ashkboos and Langwen Huang and Nikoli Dryden and Tal Ben{-}Nun and Peter Dueben and Lukas Gianinazzi and Luca Kummer and Torsten Hoefler},
  title      = {{ENS-10:} {A} Dataset For Post-Processing Ensemble Weather Forecast},
  journal    = {CoRR},
  volume     = {abs/2206.14786},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2206.14786},
  doi        = {10.48550/ARXIV.2206.14786},
  eprinttype = {arXiv},
  eprint     = {2206.14786},
  timestamp  = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2206-14786.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2207.07433, listed by DBLP under CoRR.
@article{DBLP:journals/corr/abs-2207-07433,
  author     = {Philipp Schaad and Tal Ben{-}Nun and Torsten Hoefler},
  title      = {Boosting Performance Optimization with Interactive Data Movement Visualization},
  journal    = {CoRR},
  volume     = {abs/2207.07433},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2207.07433},
  doi        = {10.48550/ARXIV.2207.07433},
  eprinttype = {arXiv},
  eprint     = {2207.07433},
  timestamp  = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2207-07433.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2208.01695, listed by DBLP under CoRR.
% "PolarFly" is brace-protected so sentence-casing styles keep its inner capital.
@article{DBLP:journals/corr/abs-2208-01695,
  author     = {Kartik Lakhotia and Maciej Besta and Laura Monroe and Kelly Isham and Patrick Iff and Torsten Hoefler and Fabrizio Petrini},
  title      = {{PolarFly}: {A} Cost-Effective and Flexible Low-Diameter Topology},
  journal    = {CoRR},
  volume     = {abs/2208.01695},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2208.01695},
  doi        = {10.48550/ARXIV.2208.01695},
  eprinttype = {arXiv},
  eprint     = {2208.01695},
  timestamp  = {Tue, 09 Aug 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2208-01695.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2208.11469, listed by DBLP under CoRR.
% "ProbGraph" is brace-protected so sentence-casing styles keep its inner
% capital; the compound surname "Sylos Labini" is written in "Last, First"
% form so that BibTeX keeps both words in the surname.
@article{DBLP:journals/corr/abs-2208-11469,
  author     = {Maciej Besta and Cesare Miglioli and Sylos Labini, Paolo and Jakub Tetek and Patrick Iff and Raghavendra Kanakagiri and Saleh Ashkboos and Kacper Janda and Michal Podstawski and Grzegorz Kwasniewski and Niels Gleinig and Flavio Vella and Onur Mutlu and Torsten Hoefler},
  title      = {{ProbGraph}: High-Performance and High-Accuracy Graph Mining with Probabilistic Set Representations},
  journal    = {CoRR},
  volume     = {abs/2208.11469},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2208.11469},
  doi        = {10.48550/ARXIV.2208.11469},
  eprinttype = {arXiv},
  eprint     = {2208.11469},
  timestamp  = {Tue, 30 Aug 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2208-11469.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2209.01346, listed by DBLP under CoRR.
% "HammingMesh" is brace-protected so sentence-casing styles keep its inner
% capital; the compound surnames "De Sensi" and "Di Girolamo" are written in
% "Last, First" form so that BibTeX keeps both words in the surname.
@article{DBLP:journals/corr/abs-2209-01346,
  author     = {Torsten Hoefler and Tommaso Bonato and De Sensi, Daniele and Di Girolamo, Salvatore and Shigang Li and Marco Heddes and Jon Belk and Deepak Goel and Miguel Castro and Steve Scott},
  title      = {{HammingMesh}: {A} Network Topology for Large-Scale Deep Learning},
  journal    = {CoRR},
  volume     = {abs/2209.01346},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2209.01346},
  doi        = {10.48550/ARXIV.2209.01346},
  eprinttype = {arXiv},
  eprint     = {2209.01346},
  timestamp  = {Thu, 09 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2209-01346.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2209.03125, listed by DBLP under CoRR.
@article{DBLP:journals/corr/abs-2209-03125,
  author     = {Andrei Ivanov and Benjamin Rothenberger and Arnaud Dethise and Marco Canini and Torsten Hoefler and Adrian Perrig},
  title      = {{SAGE:} Software-based Attestation for {GPU} Execution},
  journal    = {CoRR},
  volume     = {abs/2209.03125},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2209.03125},
  doi        = {10.48550/ARXIV.2209.03125},
  eprinttype = {arXiv},
  eprint     = {2209.03125},
  timestamp  = {Wed, 07 Dec 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2209-03125.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2209.06979, listed by DBLP under CoRR.
@article{DBLP:journals/corr/abs-2209-06979,
  author     = {Shigang Li and Kazuki Osawa and Torsten Hoefler},
  title      = {Efficient Quantized Sparse Matrix Operations on Tensor Cores},
  journal    = {CoRR},
  volume     = {abs/2209.06979},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2209.06979},
  doi        = {10.48550/ARXIV.2209.06979},
  eprinttype = {arXiv},
  eprint     = {2209.06979},
  timestamp  = {Tue, 27 Sep 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2209-06979.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2209.09732, listed by DBLP under CoRR.
@article{DBLP:journals/corr/abs-2209-09732,
  author     = {Maciej Besta and Patrick Iff and Florian Scheidl and Kazuki Osawa and Nikoli Dryden and Michal Podstawski and Tiancheng Chen and Torsten Hoefler},
  title      = {Neural Graph Databases},
  journal    = {CoRR},
  volume     = {abs/2209.09732},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2209.09732},
  doi        = {10.48550/ARXIV.2209.09732},
  eprinttype = {arXiv},
  eprint     = {2209.09732},
  timestamp  = {Wed, 28 Sep 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2209-09732.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2210.04598, listed by DBLP under CoRR.
% The compound surname "De Matteis" is written in "Last, First" form so that
% BibTeX does not parse "De" as part of the given name.
@article{DBLP:journals/corr/abs-2210-04598,
  author     = {Carl{-}Johannes Johnsen and De Matteis, Tiziano and Tal Ben{-}Nun and Johannes de Fine Licht and Torsten Hoefler},
  title      = {Temporal Vectorization: {A} Compiler Approach to Automatic Multi-Pumping},
  journal    = {CoRR},
  volume     = {abs/2210.04598},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.04598},
  doi        = {10.48550/ARXIV.2210.04598},
  eprinttype = {arXiv},
  eprint     = {2210.04598},
  timestamp  = {Thu, 13 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-04598.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2210.12538, listed by DBLP under CoRR.
@article{DBLP:journals/corr/abs-2210-12538,
  author     = {Langwen Huang and Torsten Hoefler},
  title      = {Compressing multidimensional weather and climate data into neural networks},
  journal    = {CoRR},
  volume     = {abs/2210.12538},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.12538},
  doi        = {10.48550/ARXIV.2210.12538},
  eprinttype = {arXiv},
  eprint     = {2210.12538},
  timestamp  = {Fri, 28 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-12538.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2210.15315, listed by DBLP under CoRR.
% The compound surnames "De Sensi", "De Matteis" and "Di Girolamo" are written
% in "Last, First" form so that BibTeX keeps both words in the surname.
@article{DBLP:journals/corr/abs-2210-15315,
  author     = {De Sensi, Daniele and De Matteis, Tiziano and Konstantin Taranov and Di Girolamo, Salvatore and Tobias Rahn and Torsten Hoefler},
  title      = {Noise in the Clouds: Influence of Network Performance Variability on Application Scalability},
  journal    = {CoRR},
  volume     = {abs/2210.15315},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.15315},
  doi        = {10.48550/ARXIV.2210.15315},
  eprinttype = {arXiv},
  eprint     = {2210.15315},
  timestamp  = {Wed, 02 Nov 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-15315.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2210.17323, listed by DBLP under CoRR.
@article{DBLP:journals/corr/abs-2210-17323,
  author     = {Elias Frantar and Saleh Ashkboos and Torsten Hoefler and Dan Alistarh},
  title      = {{GPTQ:} Accurate Post-Training Quantization for Generative Pre-trained Transformers},
  journal    = {CoRR},
  volume     = {abs/2210.17323},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.17323},
  doi        = {10.48550/ARXIV.2210.17323},
  eprinttype = {arXiv},
  eprint     = {2210.17323},
  timestamp  = {Thu, 03 Nov 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-17323.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2211.07629, listed by DBLP under CoRR.
@article{DBLP:journals/corr/abs-2211-07629,
  author     = {Michael E. Beverland and Prakash Murali and Matthias Troyer and Krysta M. Svore and Torsten Hoefler and Vadym Kliuchnikov and Guang Hao Low and Mathias Soeken and Aarthi Sundaram and Alexander Vaschillo},
  title      = {Assessing requirements to scale to practical quantum advantage},
  journal    = {CoRR},
  volume     = {abs/2211.07629},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2211.07629},
  doi        = {10.48550/ARXIV.2211.07629},
  eprinttype = {arXiv},
  eprint     = {2211.07629},
  timestamp  = {Wed, 16 Nov 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2211-07629.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2211.13491, listed by DBLP under CoRR.
@article{DBLP:journals/corr/abs-2211-13491,
  author     = {Nikoli Dryden and Torsten Hoefler},
  title      = {Spatial Mixture-of-Experts},
  journal    = {CoRR},
  volume     = {abs/2211.13491},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2211.13491},
  doi        = {10.48550/ARXIV.2211.13491},
  eprinttype = {arXiv},
  eprint     = {2211.13491},
  timestamp  = {Tue, 29 Nov 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2211-13491.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2211.13980 (listed by dblp under CoRR), 2022.
% Title: the proper noun Hamming is braced so sentence-casing styles keep its capital.
@article{DBLP:journals/corr/abs-2211-13980,
  author     = {Patrick Iff and Maciej Besta and Matheus A. Cavalcante and Tim Fischer and Luca Benini and Torsten Hoefler},
  title      = {Sparse {Hamming} Graph: {A} Customizable Network-on-Chip Topology},
  journal    = {CoRR},
  volume     = {abs/2211.13980},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2211.13980},
  doi        = {10.48550/ARXIV.2211.13980},
  eprinttype = {arXiv},
  eprint     = {2211.13980},
  timestamp  = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2211-13980.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2211.13989 (listed by dblp under CoRR), 2022.
% Title: the CamelCase name HexaMesh is braced so sentence-casing styles do not print "Hexamesh".
@article{DBLP:journals/corr/abs-2211-13989,
  author     = {Patrick Iff and Maciej Besta and Matheus A. Cavalcante and Tim Fischer and Luca Benini and Torsten Hoefler},
  title      = {{HexaMesh}: Scaling to Hundreds of Chiplets with an Optimized Chiplet Arrangement},
  journal    = {CoRR},
  volume     = {abs/2211.13989},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2211.13989},
  doi        = {10.48550/ARXIV.2211.13989},
  eprinttype = {arXiv},
  eprint     = {2211.13989},
  timestamp  = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2211-13989.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2211.14133 (listed by dblp under CoRR), 2022.
% Title: PipeFisher (CamelCase name) and Fisher (proper noun) are braced so
% sentence-casing styles keep their capitalization.
@article{DBLP:journals/corr/abs-2211-14133,
  author     = {Kazuki Osawa and Shigang Li and Torsten Hoefler},
  title      = {{PipeFisher}: Efficient Training of Large Language Models Using Pipelining and {Fisher} Information Matrices},
  journal    = {CoRR},
  volume     = {abs/2211.14133},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2211.14133},
  doi        = {10.48550/ARXIV.2211.14133},
  eprinttype = {arXiv},
  eprint     = {2211.14133},
  timestamp  = {Tue, 29 Nov 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2211-14133.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2212.09134 (listed by dblp under CoRR), 2022.
@article{DBLP:journals/corr/abs-2212-09134,
  author     = {Konstantin Taranov and Fabian Fischer and Torsten Hoefler},
  title      = {Efficient {RDMA} Communication Protocols},
  journal    = {CoRR},
  volume     = {abs/2212.09134},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2212.09134},
  doi        = {10.48550/ARXIV.2212.09134},
  eprinttype = {arXiv},
  eprint     = {2212.09134},
  timestamp  = {Tue, 10 Jan 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2212-09134.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2212.13768 (listed by dblp under CoRR), 2022.
@article{DBLP:journals/corr/abs-2212-13768,
  author     = {Johannes de Fine Licht and Tiziano De Matteis and Tal Ben{-}Nun and Andreas Kuster and Oliver Rausch and Manuel Burger and Carl{-}Johannes Johnsen and Torsten Hoefler},
  title      = {Python {FPGA} Programming with Data-Centric Multi-Level Design},
  journal    = {CoRR},
  volume     = {abs/2212.13768},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2212.13768},
  doi        = {10.48550/ARXIV.2212.13768},
  eprinttype = {arXiv},
  eprint     = {2212.13768},
  timestamp  = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2212-13768.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: J. Mach. Learn. Res. 22, article 241, 2021 (no DOI in the dblp record).
@article{DBLP:journals/jmlr/HoeflerABDP21,
  author     = {Torsten Hoefler and Dan Alistarh and Tal Ben{-}Nun and Nikoli Dryden and Alexandra Peste},
  title      = {Sparsity in Deep Learning: Pruning and growth for efficient inference and training in neural networks},
  journal    = {J. Mach. Learn. Res.},
  volume     = {22},
  pages      = {241:1--241:124},
  year       = {2021},
  url        = {http://jmlr.org/papers/v22/21-0366.html},
  timestamp  = {Mon, 31 Jan 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/jmlr/HoeflerABDP21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: Nat. Comput. Sci. 1(2), pp. 104--113, 2021.
% Title: Earth is braced so sentence-casing styles do not print "earth-system".
@article{DBLP:journals/ncs/BauerDHQSW21,
  author     = {Peter Bauer and Peter D. D{\"{u}}ben and Torsten Hoefler and Tiago Quintino and Thomas C. Schulthess and Nils P. Wedi},
  title      = {The digital revolution of {Earth}-system science},
  journal    = {Nat. Comput. Sci.},
  volume     = {1},
  number     = {2},
  pages      = {104--113},
  year       = {2021},
  url        = {https://doi.org/10.1038/s43588-021-00023-0},
  doi        = {10.1038/S43588-021-00023-0},
  timestamp  = {Mon, 15 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/ncs/BauerDHQSW21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: Proc. ACM Program. Lang. 5(OOPSLA), pp. 1--26, 2021.
% Title: the proper noun Presburger is braced so sentence-casing styles keep its capital.
@article{DBLP:journals/pacmpl/PitchanathanUWH21,
  author     = {Arjun Pitchanathan and Christian Ulmann and Michel Weber and Torsten Hoefler and Tobias Grosser},
  title      = {{FPL:} fast {Presburger} arithmetic through transprecision},
  journal    = {Proc. {ACM} Program. Lang.},
  volume     = {5},
  number     = {{OOPSLA}},
  pages      = {1--26},
  year       = {2021},
  url        = {https://doi.org/10.1145/3485539},
  doi        = {10.1145/3485539},
  timestamp  = {Wed, 25 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/pacmpl/PitchanathanUWH21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: Proc. ACM Meas. Anal. Comput. Syst. 6(3), article 49.
% NOTE(review): year changed from 2021 to 2022. Volume 6(3) and the October 2022
% arXiv preprint of the same paper (2210.15315) both point to 2022; confirm on the
% publisher page. The citation key and biburl are left unchanged so existing
% citations keep resolving.
@article{DBLP:journals/pomacs/SensiMTGRH21,
  author     = {Daniele De Sensi and Tiziano De Matteis and Konstantin Taranov and Salvatore Di Girolamo and Tobias Rahn and Torsten Hoefler},
  title      = {Noise in the Clouds: Influence of Network Performance Variability on Application Scalability},
  journal    = {Proc. {ACM} Meas. Anal. Comput. Syst.},
  volume     = {6},
  number     = {3},
  pages      = {49:1--49:27},
  year       = {2022},
  url        = {https://doi.org/10.1145/3570609},
  doi        = {10.1145/3570609},
  timestamp  = {Sun, 15 Jan 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/pomacs/SensiMTGRH21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: Proc. VLDB Endow. 14(11), pp. 1922--1936, 2021.
% Title: the CamelCase name GraphMineSuite is braced so sentence-casing styles
% do not print "Graphminesuite".
@article{DBLP:journals/pvldb/BestaVSSKGBJHLT21,
  author     = {Maciej Besta and Zur Vonarburg{-}Shmaria and Yannick Schaffner and Leonardo Schwarz and Grzegorz Kwasniewski and Lukas Gianinazzi and Jakub Ber{\'{a}}nek and Kacper Janda and Tobias Holenstein and Sebastian Leisinger and Peter Tatkowski and Esref {\"{O}}zdemir and Adrian Balla and Marcin Copik and Philipp Lindenberger and Marek Konieczny and Onur Mutlu and Torsten Hoefler},
  title      = {{GraphMineSuite}: Enabling High-Performance and Programmable Graph Mining Algorithms with Set Algebra},
  journal    = {Proc. {VLDB} Endow.},
  volume     = {14},
  number     = {11},
  pages      = {1922--1936},
  year       = {2021},
  url        = {http://www.vldb.org/pvldb/vol14/p1922-besta.pdf},
  doi        = {10.14778/3476249.3476252},
  timestamp  = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/pvldb/BestaVSSKGBJHLT21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: SIAM J. Sci. Comput. 43(5), pp. A3328--A3356, 2021.
@article{DBLP:journals/siamsc/SolomonikDH21,
  author     = {Edgar Solomonik and James Demmel and Torsten Hoefler},
  title      = {Communication Lower Bounds of Bilinear Algorithms for Symmetric Tensor Contractions},
  journal    = {{SIAM} J. Sci. Comput.},
  volume     = {43},
  number     = {5},
  pages      = {A3328--A3356},
  year       = {2021},
  url        = {https://doi.org/10.1137/20M1338599},
  doi        = {10.1137/20M1338599},
  timestamp  = {Fri, 03 Dec 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/siamsc/SolomonikDH21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: ACM Trans. Archit. Code Optim. 18(4), article 51, 2021.
% Title: the second GPU was unprotected (the first one already was) and would be
% lower-cased by sentence-casing styles; the name Open Earth Compiler is braced
% for the same reason.
@article{DBLP:journals/taco/GysiMZHDWFHG21,
  author     = {Tobias Gysi and Christoph M{\"{u}}ller and Oleksandr Zinenko and Stephan Herhut and Eddie Davis and Tobias Wicky and Oliver Fuhrer and Torsten Hoefler and Tobias Grosser},
  title      = {Domain-Specific Multi-Level {IR} Rewriting for {GPU:} The {Open Earth Compiler} for {GPU}-accelerated Climate Simulation},
  journal    = {{ACM} Trans. Archit. Code Optim.},
  volume     = {18},
  number     = {4},
  pages      = {51:1--51:23},
  year       = {2021},
  url        = {https://doi.org/10.1145/3469030},
  doi        = {10.1145/3469030},
  timestamp  = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/taco/GysiMZHDWFHG21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: IEEE Trans. Computers 70(2), pp. 212--227, 2021.
@article{DBLP:journals/tc/SchuikiZHB21,
  author     = {Fabian Schuiki and Florian Zaruba and Torsten Hoefler and Luca Benini},
  title      = {Stream Semantic Registers: {A} Lightweight {RISC-V} {ISA} Extension Achieving Full Compute Utilization in Single-Issue Cores},
  journal    = {{IEEE} Trans. Computers},
  volume     = {70},
  number     = {2},
  pages      = {212--227},
  year       = {2021},
  url        = {https://doi.org/10.1109/TC.2020.2987314},
  doi        = {10.1109/TC.2020.2987314},
  timestamp  = {Tue, 26 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/tc/SchuikiZHB21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: IEEE Trans. Computers 70(11), pp. 1845--1860, 2021.
@article{DBLP:journals/tc/ZarubaSHB21,
  author     = {Florian Zaruba and Fabian Schuiki and Torsten Hoefler and Luca Benini},
  title      = {Snitch: {A} Tiny Pseudo Dual-Issue Processor for Area and Energy Efficient Execution of Floating-Point Intensive Workloads},
  journal    = {{IEEE} Trans. Computers},
  volume     = {70},
  number     = {11},
  pages      = {1845--1860},
  year       = {2021},
  url        = {https://doi.org/10.1109/TC.2020.3027900},
  doi        = {10.1109/TC.2020.3027900},
  timestamp  = {Wed, 03 Nov 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/tc/ZarubaSHB21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: IEEE Trans. Parallel Distributed Syst. 32(4), pp. 943--959, 2021.
% Title: the proper noun Ethernet is braced so sentence-casing styles keep its capital.
@article{DBLP:journals/tpds/BestaDSKGSSH21,
  author     = {Maciej Besta and Jens Domke and Marcel Schneider and Marek Konieczny and Salvatore Di Girolamo and Timo Schneider and Ankit Singla and Torsten Hoefler},
  title      = {High-Performance Routing With Multipathing and Path Diversity in {Ethernet} and {HPC} Networks},
  journal    = {{IEEE} Trans. Parallel Distributed Syst.},
  volume     = {32},
  number     = {4},
  pages      = {943--959},
  year       = {2021},
  url        = {https://doi.org/10.1109/TPDS.2020.3035761},
  doi        = {10.1109/TPDS.2020.3035761},
  timestamp  = {Sun, 25 Jul 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/tpds/BestaDSKGSSH21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: IEEE Trans. Parallel Distributed Syst. 32(5), pp. 1014--1029, 2021.
@article{DBLP:journals/tpds/LichtBMH21,
  author     = {Johannes de Fine Licht and Maciej Besta and Simon Meierhans and Torsten Hoefler},
  title      = {Transformations of High-Level Synthesis Codes for High-Performance Computing},
  journal    = {{IEEE} Trans. Parallel Distributed Syst.},
  volume     = {32},
  number     = {5},
  pages      = {1014--1029},
  year       = {2021},
  url        = {https://doi.org/10.1109/TPDS.2020.3039409},
  doi        = {10.1109/TPDS.2020.3039409},
  timestamp  = {Tue, 26 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/tpds/LichtBMH21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: IEEE Trans. Parallel Distributed Syst. 32(7), pp. 1725--1739, 2021.
@article{DBLP:journals/tpds/LiBNGDAH21,
  author     = {Shigang Li and Tal Ben{-}Nun and Giorgi Nadiradze and Salvatore Di Girolamo and Nikoli Dryden and Dan Alistarh and Torsten Hoefler},
  title      = {Breaking (Global) Barriers in Parallel Stochastic Optimization With Wait-Avoiding Group Averaging},
  journal    = {{IEEE} Trans. Parallel Distributed Syst.},
  volume     = {32},
  number     = {7},
  pages      = {1725--1739},
  year       = {2021},
  url        = {https://doi.org/10.1109/TPDS.2020.3040606},
  doi        = {10.1109/TPDS.2020.3040606},
  timestamp  = {Tue, 02 Mar 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/tpds/LiBNGDAH21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: ANT 2021 / EDI40 2021, Procedia Computer Science 184, pp. 635--641.
% Title: the mixed-case name MATSim is braced so sentence-casing styles do not print "matsim".
@inproceedings{DBLP:conf/ant/GraurBBRSHA21,
  author     = {Dan Graur and Rodrigo Bruno and Joschka Bischoff and Marcel Rieser and Wolfgang Scherr and Torsten Hoefler and Gustavo Alonso},
  editor     = {Elhadi M. Shakshuki and Ansar{-}Ul{-}Haque Yasar},
  title      = {Hermes: Enabling efficient large-scale simulation in {MATSim}},
  booktitle  = {The 12th International Conference on Ambient Systems, Networks and Technologies {(ANT} 2021) / The 4th International Conference on Emerging Data and Industry 4.0 {(EDI40} 2021) / Affiliated Workshops, March 23-26, 2021, Warsaw, Poland},
  series     = {Procedia Computer Science},
  volume     = {184},
  pages      = {635--641},
  publisher  = {Elsevier},
  year       = {2021},
  url        = {https://doi.org/10.1016/j.procs.2021.03.079},
  doi        = {10.1016/J.PROCS.2021.03.079},
  timestamp  = {Wed, 27 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/ant/GraurBBRSHA21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: CGO 2021, pp. 315--326.
% Title: the CamelCase name StencilFlow is braced so sentence-casing styles
% do not print "Stencilflow".
@inproceedings{DBLP:conf/cgo/LichtKMBHH21,
  author     = {Johannes de Fine Licht and Andreas Kuster and Tiziano De Matteis and Tal Ben{-}Nun and Dominic Hofer and Torsten Hoefler},
  editor     = {Jae W. Lee and Mary Lou Soffa and Ayal Zaks},
  title      = {{StencilFlow}: Mapping Large Stencil Programs to Distributed Spatial Computing Systems},
  booktitle  = {{IEEE/ACM} International Symposium on Code Generation and Optimization, {CGO} 2021, Seoul, South Korea, February 27 - March 3, 2021},
  pages      = {315--326},
  publisher  = {{IEEE}},
  year       = {2021},
  url        = {https://doi.org/10.1109/CGO51591.2021.9370315},
  doi        = {10.1109/CGO51591.2021.9370315},
  timestamp  = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/cgo/LichtKMBHH21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: DAC 2021, pp. 433--438.
@inproceedings{DBLP:conf/dac/GleinigH21,
  author     = {Niels Gleinig and Torsten Hoefler},
  title      = {An Efficient Algorithm for Sparse Quantum State Preparation},
  booktitle  = {58th {ACM/IEEE} Design Automation Conference, {DAC} 2021, San Francisco, CA, USA, December 5-9, 2021},
  pages      = {433--438},
  publisher  = {{IEEE}},
  year       = {2021},
  url        = {https://doi.org/10.1109/DAC18074.2021.9586240},
  doi        = {10.1109/DAC18074.2021.9586240},
  timestamp  = {Fri, 12 Nov 2021 12:31:50 +0100},
  biburl     = {https://dblp.org/rec/conf/dac/GleinigH21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: DATE 2021, pp. 1787--1792.
@inproceedings{DBLP:conf/date/SchefflerZSHB21,
  author     = {Paul Scheffler and Florian Zaruba and Fabian Schuiki and Torsten Hoefler and Luca Benini},
  title      = {Indirection Stream Semantic Register Architecture for Efficient Sparse-Dense Linear Algebra},
  booktitle  = {Design, Automation {\&} Test in Europe Conference {\&} Exhibition, {DATE} 2021, Grenoble, France, February 1-5, 2021},
  pages      = {1787--1792},
  publisher  = {{IEEE}},
  year       = {2021},
  url        = {https://doi.org/10.23919/DATE51398.2021.9474230},
  doi        = {10.23919/DATE51398.2021.9474230},
  timestamp  = {Wed, 21 Jul 2021 10:04:34 +0200},
  biburl     = {https://dblp.org/rec/conf/date/SchefflerZSHB21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: ICML 2021, Proceedings of Machine Learning Research 139, pp. 2244--2253.
% Title: the mixed-case name ProGraML is braced so sentence-casing styles
% do not print "Programl".
@inproceedings{DBLP:conf/icml/CumminsFBHOL21,
  author     = {Chris Cummins and Zacharias V. Fisches and Tal Ben{-}Nun and Torsten Hoefler and Michael F. P. O'Boyle and Hugh Leather},
  editor     = {Marina Meila and Tong Zhang},
  title      = {{ProGraML}: {A} Graph-based Program Representation for Data Flow Analysis and Compiler Optimizations},
  booktitle  = {Proceedings of the 38th International Conference on Machine Learning, {ICML} 2021, 18-24 July 2021, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {139},
  pages      = {2244--2253},
  publisher  = {{PMLR}},
  year       = {2021},
  url        = {http://proceedings.mlr.press/v139/cummins21a.html},
  timestamp  = {Wed, 25 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/CumminsFBHOL21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: ICS 2021, pp. 63--74.
% Title: the names NPBench and NumPy are braced so sentence-casing styles
% do not print "Npbench" and "numpy".
@inproceedings{DBLP:conf/ics/ZiogasBSH21,
  author     = {Alexandros Nikolaos Ziogas and Tal Ben{-}Nun and Timo Schneider and Torsten Hoefler},
  editor     = {Huiyang Zhou and Jose Moreira and Frank Mueller and Yoav Etsion},
  title      = {{NPBench}: a benchmarking suite for high-performance {NumPy}},
  booktitle  = {{ICS} '21: 2021 International Conference on Supercomputing, Virtual Event, USA, June 14-17, 2021},
  pages      = {63--74},
  publisher  = {{ACM}},
  year       = {2021},
  url        = {https://doi.org/10.1145/3447818.3460360},
  doi        = {10.1145/3447818.3460360},
  timestamp  = {Wed, 09 Jun 2021 15:33:33 +0200},
  biburl     = {https://dblp.org/rec/conf/ics/ZiogasBSH21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: IPDPS 2021, pp. 23--34.
@inproceedings{DBLP:conf/ipps/RitterGWCRH021,
  author     = {Marcus Ritter and Alexander Gei{\ss} and Johannes Wehrstein and Alexandru Calotoiu and Thorsten Reimann and Torsten Hoefler and Felix Wolf},
  title      = {Noise-Resilient Empirical Performance Modeling with Deep Neural Networks},
  booktitle  = {35th {IEEE} International Parallel and Distributed Processing Symposium, {IPDPS} 2021, Portland, OR, USA, May 17-21, 2021},
  pages      = {23--34},
  publisher  = {{IEEE}},
  year       = {2021},
  url        = {https://doi.org/10.1109/IPDPS49936.2021.00012},
  doi        = {10.1109/IPDPS49936.2021.00012},
  timestamp  = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/ipps/RitterGWCRH021.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: ISCA 2021, pp. 958--971.
@inproceedings{DBLP:conf/isca/GirolamoKCBSBBH21,
  author     = {Salvatore Di Girolamo and Andreas Kurth and Alexandru Calotoiu and Thomas Benz and Timo Schneider and Jakub Ber{\'{a}}nek and Luca Benini and Torsten Hoefler},
  title      = {A {RISC-V} in-network accelerator for flexible high-performance low-power packet processing},
  booktitle  = {48th {ACM/IEEE} Annual International Symposium on Computer Architecture, {ISCA} 2021, Virtual Event / Valencia, Spain, June 14-18, 2021},
  pages      = {958--971},
  publisher  = {{IEEE}},
  year       = {2021},
  url        = {https://doi.org/10.1109/ISCA52012.2021.00079},
  doi        = {10.1109/ISCA52012.2021.00079},
  timestamp  = {Mon, 19 Feb 2024 07:32:07 +0100},
  biburl     = {https://dblp.org/rec/conf/isca/GirolamoKCBSBBH21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: MICRO 2021, pp. 282--297.
@inproceedings{DBLP:conf/micro/BestaKKABKJVGSG21,
  author     = {Maciej Besta and Raghavendra Kanakagiri and Grzegorz Kwasniewski and Rachata Ausavarungnirun and Jakub Ber{\'{a}}nek and Konstantinos Kanellopoulos and Kacper Janda and Zur Vonarburg{-}Shmaria and Lukas Gianinazzi and Ioana Stefan and Juan G{\'{o}}mez{-}Luna and Jakub Golinowski and Marcin Copik and Lukas Kapp{-}Schwoerer and Salvatore Di Girolamo and Nils Blach and Marek Konieczny and Onur Mutlu and Torsten Hoefler},
  title      = {{SISA:} Set-Centric Instruction Set Architecture for Graph Mining on Processing-in-Memory Systems},
  booktitle  = {{MICRO} '21: 54th Annual {IEEE/ACM} International Symposium on Microarchitecture, Virtual Event, Greece, October 18-22, 2021},
  pages      = {282--297},
  publisher  = {{ACM}},
  year       = {2021},
  url        = {https://doi.org/10.1145/3466752.3480133},
  doi        = {10.1145/3466752.3480133},
  timestamp  = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/micro/BestaKKABKJVGSG21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: Middleware 2021, pp. 64--78.
% Title: the mixed-case name SeBS is braced so sentence-casing styles do not print "Sebs".
@inproceedings{DBLP:conf/middleware/CopikKBPH21,
  author     = {Marcin Copik and Grzegorz Kwasniewski and Maciej Besta and Michal Podstawski and Torsten Hoefler},
  editor     = {Kaiwen Zhang and Abdelouahed Gherbi and Nalini Venkatasubramanian and Lu{\'{\i}}s Veiga},
  title      = {{SeBS}: a serverless benchmark suite for function-as-a-service computing},
  booktitle  = {Middleware '21: 22nd International Middleware Conference, Qu{\'{e}}bec City, Canada, December 6 - 10, 2021},
  pages      = {64--78},
  publisher  = {{ACM}},
  year       = {2021},
  url        = {https://doi.org/10.1145/3464298.3476133},
  doi        = {10.1145/3464298.3476133},
  timestamp  = {Sat, 09 Apr 2022 12:40:10 +0200},
  biburl     = {https://dblp.org/rec/conf/middleware/CopikKBPH21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: MLSys 2021 (the dblp record carries no pages and no DOI).
@inproceedings{DBLP:conf/mlsys/IvanovDB0H21,
  author     = {Andrei Ivanov and Nikoli Dryden and Tal Ben{-}Nun and Shigang Li and Torsten Hoefler},
  editor     = {Alex Smola and Alex Dimakis and Ion Stoica},
  title      = {Data Movement Is All You Need: {A} Case Study on Optimizing Transformers},
  booktitle  = {Proceedings of Machine Learning and Systems 2021, MLSys 2021, virtual, April 5-9, 2021},
  publisher  = {mlsys.org},
  year       = {2021},
  url        = {https://proceedings.mlsys.org/paper/2021/hash/c9e1074f5b3f9fc8ea15d152add07294-Abstract.html},
  timestamp  = {Mon, 23 May 2022 11:55:02 +0200},
  biburl     = {https://dblp.org/rec/conf/mlsys/IvanovDB0H21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: PPoPP 2021, pp. 403--417.
% booktitle: the date range read "February 27- March 3" (space missing before the
% hyphen); it is now spaced symmetrically so it prints cleanly.
@inproceedings{DBLP:conf/ppopp/CopikCGW0H21,
  author     = {Marcin Copik and Alexandru Calotoiu and Tobias Grosser and Nicolas Wicki and Felix Wolf and Torsten Hoefler},
  editor     = {Jaejin Lee and Erez Petrank},
  title      = {Extracting clean performance models from tainted programs},
  booktitle  = {PPoPP '21: 26th {ACM} {SIGPLAN} Symposium on Principles and Practice of Parallel Programming, Virtual Event, Republic of Korea, February 27 - March 3, 2021},
  pages      = {403--417},
  publisher  = {{ACM}},
  year       = {2021},
  url        = {https://doi.org/10.1145/3437801.3441613},
  doi        = {10.1145/3437801.3441613},
  timestamp  = {Sun, 12 Jun 2022 19:46:08 +0200},
  biburl     = {https://dblp.org/rec/conf/ppopp/CopikCGW0H21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: PPoPP 2021, pp. 463--464.
% booktitle: the date range read "February 27- March 3" (space missing before the
% hyphen); it is now spaced symmetrically so it prints cleanly.
@inproceedings{DBLP:conf/ppopp/KwasniewskiBZSB21,
  author     = {Grzegorz Kwasniewski and Tal Ben{-}Nun and Alexandros Nikolaos Ziogas and Timo Schneider and Maciej Besta and Torsten Hoefler},
  editor     = {Jaejin Lee and Erez Petrank},
  title      = {On the parallel {I/O} optimality of linear algebra kernels: near-optimal {LU} factorization},
  booktitle  = {PPoPP '21: 26th {ACM} {SIGPLAN} Symposium on Principles and Practice of Parallel Programming, Virtual Event, Republic of Korea, February 27 - March 3, 2021},
  pages      = {463--464},
  publisher  = {{ACM}},
  year       = {2021},
  url        = {https://doi.org/10.1145/3437801.3441590},
  doi        = {10.1145/3437801.3441590},
  timestamp  = {Sun, 12 Jun 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/ppopp/KwasniewskiBZSB21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: SC 2021; the pages field holds the single value 16.
@inproceedings{DBLP:conf/sc/HanerSHT21,
  author     = {Thomas H{\"{a}}ner and Damian S. Steiger and Torsten Hoefler and Matthias Troyer},
  editor     = {Bronis R. de Supinski and Mary W. Hall and Todd Gamblin},
  title      = {Distributed quantum computing with {QMPI}},
  booktitle  = {International Conference for High Performance Computing, Networking, Storage and Analysis, {SC} 2021, St. Louis, Missouri, USA, November 14-19, 2021},
  pages      = {16},
  publisher  = {{ACM}},
  year       = {2021},
  url        = {https://doi.org/10.1145/3458817.3476172},
  doi        = {10.1145/3458817.3476172},
  timestamp  = {Tue, 08 Nov 2022 16:03:02 +0100},
  biburl     = {https://dblp.org/rec/conf/sc/HanerSHT21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: SC 2021; the pages field holds the single value 27.
@inproceedings{DBLP:conf/sc/0002H21,
  author     = {Shigang Li and Torsten Hoefler},
  editor     = {Bronis R. de Supinski and Mary W. Hall and Todd Gamblin},
  title      = {Chimera: efficiently training large-scale neural networks with bidirectional pipelines},
  booktitle  = {International Conference for High Performance Computing, Networking, Storage and Analysis, {SC} 2021, St. Louis, Missouri, USA, November 14-19, 2021},
  pages      = {27},
  publisher  = {{ACM}},
  year       = {2021},
  url        = {https://doi.org/10.1145/3458817.3476145},
  doi        = {10.1145/3458817.3476145},
  timestamp  = {Tue, 08 Nov 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/sc/0002H21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: SC 2021; the pages field holds the single value 35.
@inproceedings{DBLP:conf/sc/SensiGA0H21,
  author     = {Daniele De Sensi and Salvatore Di Girolamo and Saleh Ashkboos and Shigang Li and Torsten Hoefler},
  editor     = {Bronis R. de Supinski and Mary W. Hall and Todd Gamblin},
  title      = {Flare: flexible in-network allreduce},
  booktitle  = {International Conference for High Performance Computing, Networking, Storage and Analysis, {SC} 2021, St. Louis, Missouri, USA, November 14-19, 2021},
  pages      = {35},
  publisher  = {{ACM}},
  year       = {2021},
  url        = {https://doi.org/10.1145/3458817.3476178},
  doi        = {10.1145/3458817.3476178},
  timestamp  = {Tue, 08 Nov 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/sc/SensiGA0H21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: SC 2021; the pages field holds the single value 70.
@inproceedings{DBLP:conf/sc/KwasniewskiKBZS21,
  author     = {Grzegorz Kwasniewski and Marko Kabic and Tal Ben{-}Nun and Alexandros Nikolaos Ziogas and Jens Eirik Saethre and Andr{\'{e}} Gaillard and Timo Schneider and Maciej Besta and Anton Kozhevnikov and Joost VandeVondele and Torsten Hoefler},
  editor     = {Bronis R. de Supinski and Mary W. Hall and Todd Gamblin},
  title      = {On the parallel {I/O} optimality of linear algebra kernels: near-optimal matrix factorizations},
  booktitle  = {International Conference for High Performance Computing, Networking, Storage and Analysis, {SC} 2021, St. Louis, Missouri, USA, November 14-19, 2021},
  pages      = {70},
  publisher  = {{ACM}},
  year       = {2021},
  url        = {https://doi.org/10.1145/3458817.3476167},
  doi        = {10.1145/3458817.3476167},
  timestamp  = {Tue, 08 Nov 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/sc/KwasniewskiKBZS21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: SC 2021; the pages field holds the single value 92.
@inproceedings{DBLP:conf/sc/DrydenBBH21,
  author     = {Nikoli Dryden and Roman B{\"{o}}hringer and Tal Ben{-}Nun and Torsten Hoefler},
  editor     = {Bronis R. de Supinski and Mary W. Hall and Todd Gamblin},
  title      = {Clairvoyant prefetching for distributed machine learning {I/O}},
  booktitle  = {International Conference for High Performance Computing, Networking, Storage and Analysis, {SC} 2021, St. Louis, Missouri, USA, November 14-19, 2021},
  pages      = {92},
  publisher  = {{ACM}},
  year       = {2021},
  url        = {https://doi.org/10.1145/3458817.3476181},
  doi        = {10.1145/3458817.3476181},
  timestamp  = {Tue, 08 Nov 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/sc/DrydenBBH21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: SC 2021; the pages field holds the single value 95.
% Title: the language name Python is braced so sentence-casing styles do not print "python".
@inproceedings{DBLP:conf/sc/ZiogasSBCMLLH21,
  author     = {Alexandros Nikolaos Ziogas and Timo Schneider and Tal Ben{-}Nun and Alexandru Calotoiu and Tiziano De Matteis and Johannes de Fine Licht and Luca Lavarini and Torsten Hoefler},
  editor     = {Bronis R. de Supinski and Mary W. Hall and Todd Gamblin},
  title      = {Productivity, portability, performance: data-centric {Python}},
  booktitle  = {International Conference for High Performance Computing, Networking, Storage and Analysis, {SC} 2021, St. Louis, Missouri, USA, November 14-19, 2021},
  pages      = {95},
  publisher  = {{ACM}},
  year       = {2021},
  url        = {https://doi.org/10.1145/3458817.3476176},
  doi        = {10.1145/3458817.3476176},
  timestamp  = {Tue, 08 Nov 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/sc/ZiogasSBCMLLH21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: SIGMOD 2021, pp. 1811--1824.
% Title: the mixed-case name CoRM is braced so sentence-casing styles do not print "Corm".
@inproceedings{DBLP:conf/sigmod/TaranovGH21,
  author     = {Konstantin Taranov and Salvatore Di Girolamo and Torsten Hoefler},
  editor     = {Guoliang Li and Zhanhuai Li and Stratos Idreos and Divesh Srivastava},
  title      = {{CoRM}: Compactable Remote Memory over {RDMA}},
  booktitle  = {{SIGMOD} '21: International Conference on Management of Data, Virtual Event, China, June 20-25, 2021},
  pages      = {1811--1824},
  publisher  = {{ACM}},
  year       = {2021},
  url        = {https://doi.org/10.1145/3448016.3452817},
  doi        = {10.1145/3448016.3452817},
  timestamp  = {Mon, 21 Jun 2021 11:48:16 +0200},
  biburl     = {https://dblp.org/rec/conf/sigmod/TaranovGH21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: SPAA 2021, pp. 243--253.
@inproceedings{DBLP:conf/spaa/GianinazziBSH21,
  author     = {Lukas Gianinazzi and Maciej Besta and Yannick Schaffner and Torsten Hoefler},
  editor     = {Kunal Agrawal and Yossi Azar},
  title      = {Parallel Algorithms for Finding Large Cliques in Sparse Graphs},
  booktitle  = {{SPAA} '21: 33rd {ACM} Symposium on Parallelism in Algorithms and Architectures, Virtual Event, USA, 6-8 July, 2021},
  pages      = {243--253},
  publisher  = {{ACM}},
  year       = {2021},
  url        = {https://doi.org/10.1145/3409964.3461800},
  doi        = {10.1145/3409964.3461800},
  timestamp  = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/spaa/GianinazziBSH21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: SPAA 2021, pp. 328--339.
@inproceedings{DBLP:conf/spaa/KwasniewskiBGCS21,
  author     = {Grzegorz Kwasniewski and Tal Ben{-}Nun and Lukas Gianinazzi and Alexandru Calotoiu and Timo Schneider and Alexandros Nikolaos Ziogas and Maciej Besta and Torsten Hoefler},
  editor     = {Kunal Agrawal and Yossi Azar},
  title      = {Pebbles, Graphs, and a Pinch of Combinatorics: Towards Tight {I/O} Lower Bounds for Statically Analyzable Programs},
  booktitle  = {{SPAA} '21: 33rd {ACM} Symposium on Parallelism in Algorithms and Architectures, Virtual Event, USA, 6-8 July, 2021},
  pages      = {328--339},
  publisher  = {{ACM}},
  year       = {2021},
  url        = {https://doi.org/10.1145/3409964.3461796},
  doi        = {10.1145/3409964.3461796},
  timestamp  = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/spaa/KwasniewskiBGCS21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: USENIX ATC 2021, pp. 1--14 (no DOI in the dblp record).
% Title: the language name Java is braced so sentence-casing styles do not print "java".
@inproceedings{DBLP:conf/usenix/TaranovBAH21,
  author     = {Konstantin Taranov and Rodrigo Bruno and Gustavo Alonso and Torsten Hoefler},
  editor     = {Irina Calciu and Geoff Kuenning},
  title      = {Naos: Serialization-free {RDMA} networking in {Java}},
  booktitle  = {2021 {USENIX} Annual Technical Conference, {USENIX} {ATC} 2021, July 14-16, 2021},
  pages      = {1--14},
  publisher  = {{USENIX} Association},
  year       = {2021},
  url        = {https://www.usenix.org/conference/atc21/presentation/taranov},
  timestamp  = {Thu, 12 Aug 2021 18:08:26 +0200},
  biburl     = {https://dblp.org/rec/conf/usenix/TaranovBAH21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: USENIX ATC 2021, pp. 47--63 (no DOI in the dblp record).
% Title: the mixed-case name MigrOS is braced so sentence-casing styles do not print "Migros".
@inproceedings{DBLP:conf/usenix/PlanetaBAHH21,
  author     = {Maksym Planeta and Jan Bierbaum and Leo Sahaya Daphne Antony and Torsten Hoefler and Hermann H{\"{a}}rtig},
  editor     = {Irina Calciu and Geoff Kuenning},
  title      = {{MigrOS}: Transparent Live-Migration Support for Containerised {RDMA} Applications},
  booktitle  = {2021 {USENIX} Annual Technical Conference, {USENIX} {ATC} 2021, July 14-16, 2021},
  pages      = {47--63},
  publisher  = {{USENIX} Association},
  year       = {2021},
  url        = {https://www.usenix.org/conference/atc21/presentation/planeta},
  timestamp  = {Thu, 12 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/usenix/PlanetaBAHH21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: USENIX Security 2021, pp. 4277--4292 (no DOI in the dblp record).
% Title: the mixed-case name ReDMArk is braced so sentence-casing styles do not print "Redmark".
@inproceedings{DBLP:conf/uss/RothenbergerTPH21,
  author     = {Benjamin Rothenberger and Konstantin Taranov and Adrian Perrig and Torsten Hoefler},
  editor     = {Michael D. Bailey and Rachel Greenstadt},
  title      = {{ReDMArk}: Bypassing {RDMA} Security Mechanisms},
  booktitle  = {30th {USENIX} Security Symposium, {USENIX} Security 2021, August 11-13, 2021},
  pages      = {4277--4292},
  publisher  = {{USENIX} Association},
  year       = {2021},
  url        = {https://www.usenix.org/conference/usenixsecurity21/presentation/rothenberger},
  timestamp  = {Mon, 20 Nov 2023 08:57:49 +0100},
  biburl     = {https://dblp.org/rec/conf/uss/RothenbergerTPH21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2101.08734 (listed by dblp under CoRR), 2021; no DOI in the record.
@article{DBLP:journals/corr/abs-2101-08734,
  author     = {Roman B{\"{o}}hringer and Nikoli Dryden and Tal Ben{-}Nun and Torsten Hoefler},
  title      = {Clairvoyant Prefetching for Distributed Machine Learning {I/O}},
  journal    = {CoRR},
  volume     = {abs/2101.08734},
  year       = {2021},
  url        = {https://arxiv.org/abs/2101.08734},
  eprinttype = {arXiv},
  eprint     = {2101.08734},
  timestamp  = {Sat, 30 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2101-08734.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2101.11030 (listed by dblp under CoRR), 2021; no DOI in the record.
@article{DBLP:journals/corr/abs-2101-11030,
  author     = {David Ittah and Thomas H{\"{a}}ner and Vadym Kliuchnikov and Torsten Hoefler},
  title      = {Enabling Dataflow Optimization for Quantum Programs},
  journal    = {CoRR},
  volume     = {abs/2101.11030},
  year       = {2021},
  url        = {https://arxiv.org/abs/2101.11030},
  eprinttype = {arXiv},
  eprint     = {2101.11030},
  timestamp  = {Sun, 31 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2101-11030.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2102.00554 (listed by dblp under CoRR), 2021; no DOI in the record.
@article{DBLP:journals/corr/abs-2102-00554,
  author     = {Torsten Hoefler and Dan Alistarh and Tal Ben{-}Nun and Nikoli Dryden and Alexandra Peste},
  title      = {Sparsity in Deep Learning: Pruning and growth for efficient inference and training in neural networks},
  journal    = {CoRR},
  volume     = {abs/2102.00554},
  year       = {2021},
  url        = {https://arxiv.org/abs/2102.00554},
  eprinttype = {arXiv},
  eprint     = {2102.00554},
  timestamp  = {Tue, 09 Feb 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2102-00554.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2103.03653 (listed by dblp under CoRR), 2021; no DOI in the record.
% Title: the CamelCase name GraphMineSuite is braced so sentence-casing styles
% do not print "Graphminesuite".
@article{DBLP:journals/corr/abs-2103-03653,
  author     = {Maciej Besta and Zur Vonarburg{-}Shmaria and Yannick Schaffner and Leonardo Schwarz and Grzegorz Kwasniewski and Lukas Gianinazzi and Jakub Ber{\'{a}}nek and Kacper Janda and Tobias Holenstein and Sebastian Leisinger and Peter Tatkowski and Esref {\"{O}}zdemir and Adrian Balla and Marcin Copik and Philipp Lindenberger and Pavel Kalvoda and Marek Konieczny and Onur Mutlu and Torsten Hoefler},
  title      = {{GraphMineSuite}: Enabling High-Performance and Programmable Graph Mining Algorithms with Set Algebra},
  journal    = {CoRR},
  volume     = {abs/2103.03653},
  year       = {2021},
  url        = {https://arxiv.org/abs/2103.03653},
  eprinttype = {arXiv},
  eprint     = {2103.03653},
  timestamp  = {Fri, 27 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2103-03653.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2104.07582), 2021.
@article{DBLP:journals/corr/abs-2104-07582,
  author     = {Maciej Besta and
                Raghavendra Kanakagiri and
                Grzegorz Kwasniewski and
                Rachata Ausavarungnirun and
                Jakub Ber{\'{a}}nek and
                Konstantinos Kanellopoulos and
                Kacper Janda and
                Zur Vonarburg{-}Shmaria and
                Lukas Gianinazzi and
                Ioana Stefan and
                Juan G{\'{o}}mez{-}Luna and
                Marcin Copik and
                Lukas Kapp{-}Schwoerer and
                Salvatore Di Girolamo and
                Marek Konieczny and
                Onur Mutlu and
                Torsten Hoefler},
  title      = {{SISA:} Set-Centric Instruction Set Architecture for Graph Mining on Processing-in-Memory Systems},
  journal    = {CoRR},
  volume     = {abs/2104.07582},
  year       = {2021},
  url        = {https://arxiv.org/abs/2104.07582},
  eprinttype = {arXiv},
  eprint     = {2104.07582},
  timestamp  = {Tue, 20 Apr 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2104-07582.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2105.01109), 2021.
@article{DBLP:journals/corr/abs-2105-01109,
  author     = {Thomas H{\"{a}}ner and
                Damian S. Steiger and
                Torsten Hoefler and
                Matthias Troyer},
  title      = {Distributed Quantum Computing with {QMPI}},
  journal    = {CoRR},
  volume     = {abs/2105.01109},
  year       = {2021},
  url        = {https://arxiv.org/abs/2105.01109},
  eprinttype = {arXiv},
  eprint     = {2105.01109},
  timestamp  = {Fri, 14 May 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2105-01109.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2105.07203), 2021.
@article{DBLP:journals/corr/abs-2105-07203,
  author     = {Grzegorz Kwasniewski and
                Tal Ben{-}Nun and
                Lukas Gianinazzi and
                Alexandru Calotoiu and
                Timo Schneider and
                Alexandros Nikolaos Ziogas and
                Maciej Besta and
                Torsten Hoefler},
  title      = {Pebbles, Graphs, and a Pinch of Combinatorics: Towards Tight {I/O} Lower Bounds for Statically Analyzable Programs},
  journal    = {CoRR},
  volume     = {abs/2105.07203},
  year       = {2021},
  url        = {https://arxiv.org/abs/2105.07203},
  eprinttype = {arXiv},
  eprint     = {2105.07203},
  timestamp  = {Tue, 18 May 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2105-07203.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2105.12663), 2021.
@article{DBLP:journals/corr/abs-2105-12663,
  author     = {Maciej Besta and
                Marcel Schneider and
                Salvatore Di Girolamo and
                Ankit Singla and
                Torsten Hoefler},
  title      = {Towards Million-Server Network Simulations on Just a Laptop},
  journal    = {CoRR},
  volume     = {abs/2105.12663},
  year       = {2021},
  url        = {https://arxiv.org/abs/2105.12663},
  eprinttype = {arXiv},
  eprint     = {2105.12663},
  timestamp  = {Tue, 01 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2105-12663.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2106.00761), 2021.
@article{DBLP:journals/corr/abs-2106-00761,
  author     = {Maciej Besta and
                Raphael Grob and
                Cesare Miglioli and
                Nicola Bernold and
                Grzegorz Kwasniewski and
                Gabriel Gjini and
                Raghavendra Kanakagiri and
                Saleh Ashkboos and
                Lukas Gianinazzi and
                Nikoli Dryden and
                Torsten Hoefler},
  title      = {Motif Prediction with Graph Neural Networks},
  journal    = {CoRR},
  volume     = {abs/2106.00761},
  year       = {2021},
  url        = {https://arxiv.org/abs/2106.00761},
  eprinttype = {arXiv},
  eprint     = {2106.00761},
  timestamp  = {Wed, 09 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2106-00761.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2106.03594), 2021.
@article{DBLP:journals/corr/abs-2106-03594,
  author     = {Lukas Gianinazzi and
                Maximilian Fries and
                Nikoli Dryden and
                Tal Ben{-}Nun and
                Maciej Besta and
                Torsten Hoefler},
  title      = {Learning Combinatorial Node Labeling Algorithms},
  journal    = {CoRR},
  volume     = {abs/2106.03594},
  year       = {2021},
  url        = {https://arxiv.org/abs/2106.03594},
  eprinttype = {arXiv},
  eprint     = {2106.03594},
  timestamp  = {Thu, 15 Jul 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2106-03594.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2106.13859), 2021.
% RFaaS, RDMA and FaaS are brace-protected in the title so that
% sentence-casing bibliography styles keep their capitalization.
@article{DBLP:journals/corr/abs-2106-13859,
  author     = {Marcin Copik and
                Konstantin Taranov and
                Alexandru Calotoiu and
                Torsten Hoefler},
  title      = {{RFaaS}: {RDMA}-Enabled {FaaS} Platform for Serverless High-Performance Computing},
  journal    = {CoRR},
  volume     = {abs/2106.13859},
  year       = {2021},
  url        = {https://arxiv.org/abs/2106.13859},
  eprinttype = {arXiv},
  eprint     = {2106.13859},
  timestamp  = {Wed, 30 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2106-13859.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2106.15565), 2021.
@article{DBLP:journals/corr/abs-2106-15565,
  author     = {Daniele De Sensi and
                Salvatore Di Girolamo and
                Saleh Ashkboos and
                Shigang Li and
                Torsten Hoefler},
  title      = {Flare: Flexible In-Network Allreduce},
  journal    = {CoRR},
  volume     = {abs/2106.15565},
  year       = {2021},
  url        = {https://arxiv.org/abs/2106.15565},
  eprinttype = {arXiv},
  eprint     = {2106.15565},
  timestamp  = {Mon, 05 Jul 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2106-15565.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2107.00555), 2021.
% The proper noun Python is brace-protected in the title so that
% sentence-casing bibliography styles do not lowercase it.
@article{DBLP:journals/corr/abs-2107-00555,
  author     = {Alexandros Nikolaos Ziogas and
                Timo Schneider and
                Tal Ben{-}Nun and
                Alexandru Calotoiu and
                Tiziano De Matteis and
                Johannes de Fine Licht and
                Luca Lavarini and
                Torsten Hoefler},
  title      = {Productivity, Portability, Performance: Data-Centric {Python}},
  journal    = {CoRR},
  volume     = {abs/2107.00555},
  year       = {2021},
  url        = {https://arxiv.org/abs/2107.00555},
  eprinttype = {arXiv},
  eprint     = {2107.00555},
  timestamp  = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2107-00555.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2107.06925), 2021.
% The second author is spelled "Hoefler", matching the other records in this
% file, so author sorting and name-based grouping treat him as one person.
@article{DBLP:journals/corr/abs-2107-06925,
  author     = {Shigang Li and
                Torsten Hoefler},
  title      = {Chimera: Efficiently Training Large-Scale Neural Networks with Bidirectional Pipelines},
  journal    = {CoRR},
  volume     = {abs/2107.06925},
  year       = {2021},
  url        = {https://arxiv.org/abs/2107.06925},
  eprinttype = {arXiv},
  eprint     = {2107.06925},
  timestamp  = {Wed, 21 Jul 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2107-06925.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2108.09337), 2021.
@article{DBLP:journals/corr/abs-2108-09337,
  author     = {Grzegorz Kwasniewski and
                Marko Kabic and
                Tal Ben{-}Nun and
                Alexandros Nikolaos Ziogas and
                Jens Eirik Saethre and
                Andr{\'{e}} Gaillard and
                Timo Schneider and
                Maciej Besta and
                Anton Kozhevnikov and
                Joost VandeVondele and
                Torsten Hoefler},
  title      = {On the Parallel {I/O} Optimality of Linear Algebra Kernels: Near-Optimal Matrix Factorizations},
  journal    = {CoRR},
  volume     = {abs/2108.09337},
  year       = {2021},
  url        = {https://arxiv.org/abs/2108.09337},
  eprinttype = {arXiv},
  eprint     = {2108.09337},
  timestamp  = {Fri, 27 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2108-09337.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2109.09663), 2021.
@article{DBLP:journals/corr/abs-2109-09663,
  author     = {Lukas Gianinazzi and
                Maciej Besta and
                Yannick Schaffner and
                Torsten Hoefler},
  title      = {Parallel Algorithms for Finding Large Cliques in Sparse Graphs},
  journal    = {CoRR},
  volume     = {abs/2109.09663},
  year       = {2021},
  url        = {https://arxiv.org/abs/2109.09663},
  eprinttype = {arXiv},
  eprint     = {2109.09663},
  timestamp  = {Mon, 27 Sep 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2109-09663.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2110.10802), 2021.
@article{DBLP:journals/corr/abs-2110-10802,
  author     = {Oliver Rausch and
                Tal Ben{-}Nun and
                Nikoli Dryden and
                Andrei Ivanov and
                Shigang Li and
                Torsten Hoefler},
  title      = {A Data-Centric Optimization Framework for Machine Learning},
  journal    = {CoRR},
  volume     = {abs/2110.10802},
  year       = {2021},
  url        = {https://arxiv.org/abs/2110.10802},
  eprinttype = {arXiv},
  eprint     = {2110.10802},
  timestamp  = {Thu, 28 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2110-10802.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2112.11879), 2021.
@article{DBLP:journals/corr/abs-2112-11879,
  author     = {Alexandru Calotoiu and
                Tal Ben{-}Nun and
                Grzegorz Kwasniewski and
                Johannes de Fine Licht and
                Timo Schneider and
                Philipp Schaad and
                Torsten Hoefler},
  title      = {Lifting {C} Semantics for Dataflow Optimization},
  journal    = {CoRR},
  volume     = {abs/2112.11879},
  year       = {2021},
  url        = {https://arxiv.org/abs/2112.11879},
  eprinttype = {arXiv},
  eprint     = {2112.11879},
  timestamp  = {Tue, 04 Jan 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2112-11879.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: Proc. ACM Program. Lang. 4 (OOPSLA), 2020.
@article{DBLP:journals/pacmpl/HanerHT20,
  author     = {Thomas H{\"{a}}ner and
                Torsten Hoefler and
                Matthias Troyer},
  title      = {Assertion-based optimization of Quantum programs},
  journal    = {Proc. {ACM} Program. Lang.},
  volume     = {4},
  number     = {{OOPSLA}},
  pages      = {133:1--133:20},
  year       = {2020},
  url        = {https://doi.org/10.1145/3428201},
  doi        = {10.1145/3428201},
  timestamp  = {Wed, 17 Feb 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/pacmpl/HanerHT20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: Proc. ACM Program. Lang. 4 (OOPSLA), 2020.
@article{DBLP:journals/pacmpl/GrosserTFPKRSH20,
  author     = {Tobias Grosser and
                Theodoros Theodoridis and
                Maximilian Falkenstein and
                Arjun Pitchanathan and
                Michael Kruse and
                Manuel Rigger and
                Zhendong Su and
                Torsten Hoefler},
  title      = {Fast linear programming through transprecision computing on small and sparse data},
  journal    = {Proc. {ACM} Program. Lang.},
  volume     = {4},
  number     = {{OOPSLA}},
  pages      = {195:1--195:28},
  year       = {2020},
  url        = {https://doi.org/10.1145/3428263},
  doi        = {10.1145/3428263},
  timestamp  = {Tue, 30 Nov 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/pacmpl/GrosserTFPKRSH20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article (special-issue editorial): Parallel Comput. 99, 2020.
% The conference name EuroMPI is brace-protected in the title so that
% sentence-casing bibliography styles do not lowercase it.
@article{DBLP:journals/pc/TraffH20,
  author     = {Jesper Larsson Tr{\"{a}}ff and
                Torsten Hoefler},
  title      = {Special issue: Selected papers from {EuroMPI} 2019},
  journal    = {Parallel Comput.},
  volume     = {99},
  pages      = {102695},
  year       = {2020},
  url        = {https://doi.org/10.1016/j.parco.2020.102695},
  doi        = {10.1016/J.PARCO.2020.102695},
  timestamp  = {Fri, 18 Dec 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/pc/TraffH20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: Supercomput. Front. Innov. 7(2), 2020.
@article{DBLP:journals/superfri/OsunaWTHF20,
  author     = {Carlos Osuna and
                Tobias Wicky and
                Fabian Thuering and
                Torsten Hoefler and
                Oliver Fuhrer},
  title      = {Dawn: a High-level Domain-Specific Language Compiler Toolchain for Weather and Climate Applications},
  journal    = {Supercomput. Front. Innov.},
  volume     = {7},
  number     = {2},
  pages      = {79--97},
  year       = {2020},
  url        = {https://doi.org/10.14529/jsfi200205},
  doi        = {10.14529/JSFI200205},
  timestamp  = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/superfri/OsunaWTHF20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: IEEE Trans. Comput. Aided Des. Integr. Circuits Syst. 39(11), 2020.
@article{DBLP:journals/tcad/KhanMGHC20,
  author     = {Asif Ali Khan and
                Hauke Mewes and
                Tobias Grosser and
                Torsten Hoefler and
                Jer{\'{o}}nimo Castrill{\'{o}}n},
  title      = {Polyhedral Compilation for Racetrack Memories},
  journal    = {{IEEE} Trans. Comput. Aided Des. Integr. Circuits Syst.},
  volume     = {39},
  number     = {11},
  pages      = {3968--3980},
  year       = {2020},
  url        = {https://doi.org/10.1109/TCAD.2020.3012266},
  doi        = {10.1109/TCAD.2020.3012266},
  timestamp  = {Thu, 17 Dec 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/tcad/KhanMGHC20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: ACM Trans. Reconfigurable Technol. Syst. 13(2), 2020.
@article{DBLP:journals/trets/BestaFBSLH20,
  author     = {Maciej Besta and
                Marc Fischer and
                Tal Ben{-}Nun and
                Dimitri Stanojevic and
                Johannes de Fine Licht and
                Torsten Hoefler},
  title      = {Substream-Centric Maximum Matchings on {FPGA}},
  journal    = {{ACM} Trans. Reconfigurable Technol. Syst.},
  volume     = {13},
  number     = {2},
  pages      = {8:1--8:33},
  year       = {2020},
  url        = {https://doi.org/10.1145/3377871},
  doi        = {10.1145/3377871},
  timestamp  = {Fri, 10 Jul 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/trets/BestaFBSLH20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: CVPR 2020.
@inproceedings{DBLP:conf/cvpr/HofferBHGHS20,
  author     = {Elad Hoffer and
                Tal Ben{-}Nun and
                Itay Hubara and
                Niv Giladi and
                Torsten Hoefler and
                Daniel Soudry},
  title      = {Augment Your Batch: Improving Generalization Through Instance Repetition},
  booktitle  = {2020 {IEEE/CVF} Conference on Computer Vision and Pattern Recognition, {CVPR} 2020, Seattle, WA, USA, June 13-19, 2020},
  pages      = {8126--8135},
  publisher  = {Computer Vision Foundation / {IEEE}},
  year       = {2020},
  url        = {https://openaccess.thecvf.com/content\_CVPR\_2020/html/Hoffer\_Augment\_Your\_Batch\_Improving\_Generalization\_Through\_Instance\_Repetition\_CVPR\_2020\_paper.html},
  doi        = {10.1109/CVPR42600.2020.00815},
  timestamp  = {Tue, 31 Aug 2021 14:00:04 +0200},
  biburl     = {https://dblp.org/rec/conf/cvpr/HofferBHGHS20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: DAC 2020.
% The name ATUNs is brace-protected in the title so that sentence-casing
% bibliography styles do not lowercase it.
@inproceedings{DBLP:conf/dac/KurthRZHB20,
  author     = {Andreas Kurth and
                Samuel Riedel and
                Florian Zaruba and
                Torsten Hoefler and
                Luca Benini},
  title      = {{ATUNs}: Modular and Scalable Support for Atomic Operations in a Shared Memory Multiprocessor},
  booktitle  = {57th {ACM/IEEE} Design Automation Conference, {DAC} 2020, San Francisco, CA, USA, July 20-24, 2020},
  pages      = {1--6},
  publisher  = {{IEEE}},
  year       = {2020},
  url        = {https://doi.org/10.1109/DAC18072.2020.9218661},
  doi        = {10.1109/DAC18072.2020.9218661},
  timestamp  = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/dac/KurthRZHB20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: FPGA '20.
@inproceedings{DBLP:conf/fpga/LichtKH20,
  author     = {Johannes de Fine Licht and
                Grzegorz Kwasniewski and
                Torsten Hoefler},
  editor     = {Stephen Neuendorffer and
                Lesley Shannon},
  title      = {Flexible Communication Avoiding Matrix Multiplication on {FPGA} with High-Level Synthesis},
  booktitle  = {{FPGA} '20: The 2020 {ACM/SIGDA} International Symposium on Field-Programmable Gate Arrays, Seaside, CA, USA, February 23-25, 2020},
  pages      = {244--254},
  publisher  = {{ACM}},
  year       = {2020},
  url        = {https://doi.org/10.1145/3373087.3375296},
  doi        = {10.1145/3373087.3375296},
  timestamp  = {Sun, 25 Jul 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/fpga/LichtKH20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: IPDPS 2020.
@inproceedings{DBLP:conf/ipps/RitterCRRH020,
  author     = {Marcus Ritter and
                Alexandru Calotoiu and
                Sebastian Rinke and
                Thorsten Reimann and
                Torsten Hoefler and
                Felix Wolf},
  title      = {Learning Cost-Effective Sampling Strategies for Empirical Performance Modeling},
  booktitle  = {2020 {IEEE} International Parallel and Distributed Processing Symposium (IPDPS), New Orleans, LA, USA, May 18-22, 2020},
  pages      = {884--895},
  publisher  = {{IEEE}},
  year       = {2020},
  url        = {https://doi.org/10.1109/IPDPS47924.2020.00095},
  doi        = {10.1109/IPDPS47924.2020.00095},
  timestamp  = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/ipps/RitterCRRH020.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: IPDPS 2020.
% The proper noun Jaccard is brace-protected in the title so that
% sentence-casing bibliography styles do not lowercase it.
@inproceedings{DBLP:conf/ipps/BestaKMKRHS20,
  author     = {Maciej Besta and
                Raghavendra Kanakagiri and
                Harun Mustafa and
                Mikhail Karasikov and
                Gunnar R{\"{a}}tsch and
                Torsten Hoefler and
                Edgar Solomonik},
  title      = {Communication-Efficient {Jaccard} similarity for High-Performance Distributed Genome Comparisons},
  booktitle  = {2020 {IEEE} International Parallel and Distributed Processing Symposium (IPDPS), New Orleans, LA, USA, May 18-22, 2020},
  pages      = {1122--1132},
  publisher  = {{IEEE}},
  year       = {2020},
  url        = {https://doi.org/10.1109/IPDPS47924.2020.00118},
  doi        = {10.1109/IPDPS47924.2020.00118},
  timestamp  = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/ipps/BestaKMKRHS20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: PPoPP '20.
@inproceedings{DBLP:conf/ppopp/LiBGAH20,
  author     = {Shigang Li and
                Tal Ben{-}Nun and
                Salvatore Di Girolamo and
                Dan Alistarh and
                Torsten Hoefler},
  editor     = {Rajiv Gupta and
                Xipeng Shen},
  title      = {Taming unbalanced training workloads in deep learning with partial collective operations},
  booktitle  = {PPoPP '20: 25th {ACM} {SIGPLAN} Symposium on Principles and Practice of Parallel Programming, San Diego, California, USA, February 22-26, 2020},
  pages      = {45--61},
  publisher  = {{ACM}},
  year       = {2020},
  url        = {https://doi.org/10.1145/3332466.3374528},
  doi        = {10.1145/3332466.3374528},
  timestamp  = {Sun, 12 Jun 2022 19:46:08 +0200},
  biburl     = {https://dblp.org/rec/conf/ppopp/LiBGAH20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: PPoPP '20.
@inproceedings{DBLP:conf/ppopp/JinWTHLZ20,
  author     = {Yuyang Jin and
                Haojie Wang and
                Xiongchao Tang and
                Torsten Hoefler and
                Xu Liu and
                Jidong Zhai},
  editor     = {Rajiv Gupta and
                Xipeng Shen},
  title      = {Identifying scalability bottlenecks for large-scale parallel programs with graph analysis},
  booktitle  = {PPoPP '20: 25th {ACM} {SIGPLAN} Symposium on Principles and Practice of Parallel Programming, San Diego, California, USA, February 22-26, 2020},
  pages      = {409--410},
  publisher  = {{ACM}},
  year       = {2020},
  url        = {https://doi.org/10.1145/3332466.3374518},
  doi        = {10.1145/3332466.3374518},
  timestamp  = {Sun, 12 Jun 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/ppopp/JinWTHLZ20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: EuroMPI/USA '20.
@inproceedings{DBLP:conf/pvm/NigayMSH20,
  author     = {Alexandr Nigay and
                Lukas Mosimann and
                Timo Schneider and
                Torsten Hoefler},
  editor     = {Wesley Bland and
                Kathryn M. Mohror and
                Toni Pena},
  title      = {Communication and Timing Issues with {MPI} Virtualization},
  booktitle  = {EuroMPI/USA '20: 27th European {MPI} Users' Group Meeting, Virtual Meeting, Austin, TX, USA, September 21-24, 2020},
  pages      = {11--20},
  publisher  = {{ACM}},
  year       = {2020},
  url        = {https://doi.org/10.1145/3416315.3416317},
  doi        = {10.1145/3416315.3416317},
  timestamp  = {Tue, 25 Jul 2023 13:44:09 +0200},
  biburl     = {https://dblp.org/rec/conf/pvm/NigayMSH20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: SC 2020.
% The mixed-case name FatPaths is brace-protected in the title so that
% sentence-casing bibliography styles do not lowercase it.
@inproceedings{DBLP:conf/sc/BestaSKCHGSH20,
  author     = {Maciej Besta and
                Marcel Schneider and
                Marek Konieczny and
                Karolina Cynk and
                Erik Henriksson and
                Salvatore Di Girolamo and
                Ankit Singla and
                Torsten Hoefler},
  editor     = {Christine Cuicchi and
                Irene Qualters and
                William T. Kramer},
  title      = {{FatPaths}: routing in supercomputers and data centers when shortest paths fall short},
  booktitle  = {Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis, {SC} 2020, Virtual Event / Atlanta, Georgia, USA, November 9-19, 2020},
  pages      = {27},
  publisher  = {{IEEE/ACM}},
  year       = {2020},
  url        = {https://doi.org/10.1109/SC41405.2020.00031},
  doi        = {10.1109/SC41405.2020.00031},
  timestamp  = {Wed, 04 May 2022 13:02:27 +0200},
  biburl     = {https://dblp.org/rec/conf/sc/BestaSKCHGSH20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: SC 2020.
% The mixed-case name ScalAna is brace-protected in the title so that
% sentence-casing bibliography styles do not lowercase it.
@inproceedings{DBLP:conf/sc/JinWYTH0Z20,
  author     = {Yuyang Jin and
                Haojie Wang and
                Teng Yu and
                Xiongchao Tang and
                Torsten Hoefler and
                Xu Liu and
                Jidong Zhai},
  editor     = {Christine Cuicchi and
                Irene Qualters and
                William T. Kramer},
  title      = {{ScalAna}: automating scaling loss detection with graph analysis},
  booktitle  = {Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis, {SC} 2020, Virtual Event / Atlanta, Georgia, USA, November 9-19, 2020},
  pages      = {28},
  publisher  = {{IEEE/ACM}},
  year       = {2020},
  url        = {https://doi.org/10.1109/SC41405.2020.00032},
  doi        = {10.1109/SC41405.2020.00032},
  timestamp  = {Mon, 01 Mar 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/sc/JinWYTH0Z20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: SC 2020.
@inproceedings{DBLP:conf/sc/SensiGMRH20,
  author     = {Daniele De Sensi and
                Salvatore Di Girolamo and
                Kim H. McMahon and
                Duncan Roweth and
                Torsten Hoefler},
  editor     = {Christine Cuicchi and
                Irene Qualters and
                William T. Kramer},
  title      = {An in-depth analysis of the slingshot interconnect},
  booktitle  = {Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis, {SC} 2020, Virtual Event / Atlanta, Georgia, USA, November 9-19, 2020},
  pages      = {35},
  publisher  = {{IEEE/ACM}},
  year       = {2020},
  url        = {https://doi.org/10.1109/SC41405.2020.00039},
  doi        = {10.1109/SC41405.2020.00039},
  timestamp  = {Mon, 01 Mar 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/sc/SensiGMRH20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: SC 2020.
% The mixed-case name fBLAS is brace-protected in the title so that
% sentence-casing bibliography styles do not lowercase it.
@inproceedings{DBLP:conf/sc/MatteisLH20,
  author     = {Tiziano De Matteis and
                Johannes de Fine Licht and
                Torsten Hoefler},
  editor     = {Christine Cuicchi and
                Irene Qualters and
                William T. Kramer},
  title      = {{fBLAS}: streaming linear algebra on {FPGA}},
  booktitle  = {Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis, {SC} 2020, Virtual Event / Atlanta, Georgia, USA, November 9-19, 2020},
  pages      = {59},
  publisher  = {{IEEE/ACM}},
  year       = {2020},
  url        = {https://doi.org/10.1109/SC41405.2020.00063},
  doi        = {10.1109/SC41405.2020.00063},
  timestamp  = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/sc/MatteisLH20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Workshop paper: HUST/ProTools workshop at SC 2020.
@inproceedings{DBLP:conf/sc/CalotoiuGKR0HO020,
  author     = {Alexandru Calotoiu and
                Markus Geisenhofer and
                Florian Kummer and
                Marcus Ritter and
                Jens Weber and
                Torsten Hoefler and
                Martin Oberlack and
                Felix Wolf},
  title      = {Empirical Modeling of Spatially Diverging Performance},
  booktitle  = {{IEEE/ACM} International Workshop on {HPC} User Support Tools and Workshop on Programming and Performance Visualization Tools, HUST/ProTools@SC 2020, Atlanta, GA, USA, November 18, 2020},
  pages      = {71--80},
  publisher  = {{IEEE}},
  year       = {2020},
  url        = {https://doi.org/10.1109/HUSTProtools51951.2020.00015},
  doi        = {10.1109/HUSTPROTOOLS51951.2020.00015},
  timestamp  = {Fri, 30 Apr 2021 12:35:39 +0200},
  biburl     = {https://dblp.org/rec/conf/sc/CalotoiuGKR0HO020.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: SC 2020.
@inproceedings{DBLP:conf/sc/BestaCJVGH20,
  author     = {Maciej Besta and
                Armon Carigiet and
                Kacper Janda and
                Zur Vonarburg{-}Shmaria and
                Lukas Gianinazzi and
                Torsten Hoefler},
  editor     = {Christine Cuicchi and
                Irene Qualters and
                William T. Kramer},
  title      = {High-performance parallel graph coloring with strong guarantees on work, depth, and quality},
  booktitle  = {Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis, {SC} 2020, Virtual Event / Atlanta, Georgia, USA, November 9-19, 2020},
  pages      = {99},
  publisher  = {{IEEE/ACM}},
  year       = {2020},
  url        = {https://doi.org/10.1109/SC41405.2020.00103},
  doi        = {10.1109/SC41405.2020.00103},
  timestamp  = {Mon, 01 Mar 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/sc/BestaCJVGH20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: SPAA '20.
@inproceedings{DBLP:conf/spaa/GianinazziH20,
  author     = {Lukas Gianinazzi and
                Torsten Hoefler},
  editor     = {Christian Scheideler and
                Michael Spear},
  title      = {Parallel Planar Subgraph Isomorphism and Vertex Connectivity},
  booktitle  = {{SPAA} '20: 32nd {ACM} Symposium on Parallelism in Algorithms and Architectures, Virtual Event, USA, July 15-17, 2020},
  pages      = {269--280},
  publisher  = {{ACM}},
  year       = {2020},
  url        = {https://doi.org/10.1145/3350755.3400259},
  doi        = {10.1145/3350755.3400259},
  timestamp  = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/spaa/GianinazziH20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: USENIX ATC 2020.
% sRDMA and NIC are brace-protected in the title so that sentence-casing
% bibliography styles keep their capitalization.
@inproceedings{DBLP:conf/usenix/TaranovRPH20,
  author     = {Konstantin Taranov and
                Benjamin Rothenberger and
                Adrian Perrig and
                Torsten Hoefler},
  editor     = {Ada Gavrilovska and
                Erez Zadok},
  title      = {{sRDMA} - Efficient {NIC}-based Authentication and Encryption for Remote Direct Memory Access},
  booktitle  = {2020 {USENIX} Annual Technical Conference, {USENIX} {ATC} 2020, July 15-17, 2020},
  pages      = {691--704},
  publisher  = {{USENIX} Association},
  year       = {2020},
  url        = {https://www.usenix.org/conference/atc20/presentation/taranov},
  timestamp  = {Mon, 01 Feb 2021 08:43:25 +0100},
  biburl     = {https://dblp.org/rec/conf/usenix/TaranovRPH20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Book chapter: Software for Exascale Computing - SPPEXA 2016-2019
% (Lecture Notes in Computational Science and Engineering, vol. 136), 2020.
% The mixed-case name ExtraPeak is brace-protected in the title so that
% sentence-casing bibliography styles do not lowercase it.
@incollection{DBLP:series/lncse/CalotoiuCHRS020,
  author     = {Alexandru Calotoiu and
                Marcin Copik and
                Torsten Hoefler and
                Marcus Ritter and
                Sergei Shudler and
                Felix Wolf},
  editor     = {Hans{-}Joachim Bungartz and
                Severin Reiz and
                Benjamin Uekermann and
                Philipp Neumann and
                Wolfgang E. Nagel},
  title      = {{ExtraPeak}: Advanced Automatic Performance Modeling for {HPC} Applications},
  booktitle  = {Software for Exascale Computing - {SPPEXA} 2016-2019},
  series     = {Lecture Notes in Computational Science and Engineering},
  volume     = {136},
  pages      = {453--482},
  publisher  = {Springer},
  year       = {2020},
  url        = {https://doi.org/10.1007/978-3-030-47956-5\_15},
  doi        = {10.1007/978-3-030-47956-5\_15},
  timestamp  = {Thu, 14 Oct 2021 08:45:21 +0200},
  biburl     = {https://dblp.org/rec/series/lncse/CalotoiuCHRS020.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2001.01653), 2020.
% The url uses the https scheme, like the other arXiv records in this file.
@article{DBLP:journals/corr/abs-2001-01653,
  author     = {Tobias Gysi and
                Tobias Grosser and
                Laurin Brandner and
                Torsten Hoefler},
  title      = {A Fast Analytical Model of Fully Associative Caches},
  journal    = {CoRR},
  volume     = {abs/2001.01653},
  year       = {2020},
  url        = {https://arxiv.org/abs/2001.01653},
  eprinttype = {arXiv},
  eprint     = {2001.01653},
  timestamp  = {Fri, 10 Jan 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2001-01653.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2001.07747), 2020.
@article{DBLP:journals/corr/abs-2001-07747,
  author     = {Robert Gerstenberger and
                Maciej Besta and
                Torsten Hoefler},
  title      = {Enabling Highly-Scalable Remote Memory Access Programming with {MPI-3} One Sided},
  journal    = {CoRR},
  volume     = {abs/2001.07747},
  year       = {2020},
  url        = {https://arxiv.org/abs/2001.07747},
  eprinttype = {arXiv},
  eprint     = {2001.07747},
  timestamp  = {Fri, 24 Jan 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2001-07747.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2002.10143), 2020.
% The unit kGE is brace-protected in the title so that sentence-casing
% bibliography styles do not lowercase it.
@article{DBLP:journals/corr/abs-2002-10143,
  author     = {Florian Zaruba and
                Fabian Schuiki and
                Torsten Hoefler and
                Luca Benini},
  title      = {Snitch: {A} 10 {kGE} Pseudo Dual-Issue Processor for Area and Energy Efficient Execution of Floating-Point Intensive Workloads},
  journal    = {CoRR},
  volume     = {abs/2002.10143},
  year       = {2020},
  url        = {https://arxiv.org/abs/2002.10143},
  eprinttype = {arXiv},
  eprint     = {2002.10143},
  timestamp  = {Tue, 03 Mar 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2002-10143.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2003.10536), 2020.
% The mixed-case name ProGraML is brace-protected in the title so that
% sentence-casing bibliography styles do not lowercase it.
@article{DBLP:journals/corr/abs-2003-10536,
  author     = {Chris Cummins and
                Zacharias V. Fisches and
                Tal Ben{-}Nun and
                Torsten Hoefler and
                Hugh Leather},
  title      = {{ProGraML}: Graph-based Deep Learning for Program Optimization and Analysis},
  journal    = {CoRR},
  volume     = {abs/2003.10536},
  year       = {2020},
  url        = {https://arxiv.org/abs/2003.10536},
  eprinttype = {arXiv},
  eprint     = {2003.10536},
  timestamp  = {Wed, 01 Apr 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2003-10536.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2005.00124), 2020.
@article{DBLP:journals/corr/abs-2005-00124,
  author     = {Shigang Li and
                Tal Ben{-}Nun and
                Dan Alistarh and
                Salvatore Di Girolamo and
                Nikoli Dryden and
                Torsten Hoefler},
  title      = {Breaking (Global) Barriers in Parallel Stochastic Optimization with Wait-Avoiding Group Averaging},
  journal    = {CoRR},
  volume     = {abs/2005.00124},
  year       = {2020},
  url        = {https://arxiv.org/abs/2005.00124},
  eprinttype = {arXiv},
  eprint     = {2005.00124},
  timestamp  = {Fri, 08 May 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2005-00124.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2005.08748), 2020.
@article{DBLP:journals/corr/abs-2005-08748,
  author     = {Peter Gr{\"{o}}nquist and
                Chengyuan Yao and
                Tal Ben{-}Nun and
                Nikoli Dryden and
                Peter Dueben and
                Shigang Li and
                Torsten Hoefler},
  title      = {Deep Learning for Post-Processing Ensemble Weather Forecasts},
  journal    = {CoRR},
  volume     = {abs/2005.08748},
  year       = {2020},
  url        = {https://arxiv.org/abs/2005.08748},
  eprinttype = {arXiv},
  eprint     = {2005.08748},
  timestamp  = {Fri, 22 May 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2005-08748.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2005.13014), 2020.
@article{DBLP:journals/corr/abs-2005-13014,
  author     = {Tobias Gysi and
                Christoph M{\"{u}}ller and
                Oleksandr Zinenko and
                Stephan Herhut and
                Eddie Davis and
                Tobias Wicky and
                Oliver Fuhrer and
                Torsten Hoefler and
                Tobias Grosser},
  title      = {Domain-Specific Multi-Level {IR} Rewriting for {GPU}},
  journal    = {CoRR},
  volume     = {abs/2005.13014},
  year       = {2020},
  url        = {https://arxiv.org/abs/2005.13014},
  eprinttype = {arXiv},
  eprint     = {2005.13014},
  timestamp  = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2005-13014.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2006.10598), 2020.
@article{DBLP:journals/corr/abs-2006-10598,
  author     = {Bryan A. Plummer and
                Nikoli Dryden and
                Julius Frost and
                Torsten Hoefler and
                Kate Saenko},
  title      = {Shapeshifter Networks: Cross-layer Parameter Sharing for Scalable and Effective Deep Learning},
  journal    = {CoRR},
  volume     = {abs/2006.10598},
  year       = {2020},
  url        = {https://arxiv.org/abs/2006.10598},
  eprinttype = {arXiv},
  eprint     = {2006.10598},
  timestamp  = {Tue, 23 Jun 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2006-10598.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2007.00072), 2020.
@article{DBLP:journals/corr/abs-2007-00072,
  author     = {Andrei Ivanov and
                Nikoli Dryden and
                Tal Ben{-}Nun and
                Shigang Li and
                Torsten Hoefler},
  title      = {Data Movement Is All You Need: {A} Case Study on Optimizing Transformers},
  journal    = {CoRR},
  volume     = {abs/2007.00072},
  year       = {2020},
  url        = {https://arxiv.org/abs/2007.00072},
  eprinttype = {arXiv},
  eprint     = {2007.00072},
  timestamp  = {Mon, 06 Jul 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2007-00072.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2007.01199), 2020.
@article{DBLP:journals/corr/abs-2007-01199,
  author     = {Lukas Gianinazzi and
                Torsten Hoefler},
  title      = {Parallel Planar Subgraph Isomorphism and Vertex Connectivity},
  journal    = {CoRR},
  volume     = {abs/2007.01199},
  year       = {2020},
  url        = {https://arxiv.org/abs/2007.01199},
  eprinttype = {arXiv},
  eprint     = {2007.01199},
  timestamp  = {Mon, 06 Jul 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2007-01199.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2007.03776), 2020.
@article{DBLP:journals/corr/abs-2007-03776,
  author     = {Maciej Besta and
                Jens Domke and
                Marcel Schneider and
                Marek Konieczny and
                Salvatore Di Girolamo and
                Timo Schneider and
                Ankit Singla and
                Torsten Hoefler},
  title      = {High-Performance Routing with Multipathing and Path Diversity in Supercomputers and Data Centers},
  journal    = {CoRR},
  volume     = {abs/2007.03776},
  year       = {2020},
  url        = {https://arxiv.org/abs/2007.03776},
  eprinttype = {arXiv},
  eprint     = {2007.03776},
  timestamp  = {Mon, 20 Jul 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2007-03776.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2008.08886), 2020.
@article{DBLP:journals/corr/abs-2008-08886,
  author     = {Daniele De Sensi and
                Salvatore Di Girolamo and
                Kim H. McMahon and
                Duncan Roweth and
                Torsten Hoefler},
  title      = {An In-Depth Analysis of the Slingshot Interconnect},
  journal    = {CoRR},
  volume     = {abs/2008.08886},
  year       = {2020},
  url        = {https://arxiv.org/abs/2008.08886},
  eprinttype = {arXiv},
  eprint     = {2008.08886},
  timestamp  = {Fri, 21 Aug 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2008-08886.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2008.11321), 2020.
@article{DBLP:journals/corr/abs-2008-11321,
  author     = {Maciej Besta and
                Armon Carigiet and
                Zur Vonarburg{-}Shmaria and
                Kacper Janda and
                Lukas Gianinazzi and
                Torsten Hoefler},
  title      = {High-Performance Parallel Graph Coloring with Strong Guarantees on Work, Depth, and Quality},
  journal    = {CoRR},
  volume     = {abs/2008.11321},
  year       = {2020},
  url        = {https://arxiv.org/abs/2008.11321},
  eprinttype = {arXiv},
  eprint     = {2008.11321},
  timestamp  = {Fri, 28 Aug 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2008-11321.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2009.01692, indexed by DBLP under CoRR.
% The mixed-case name "ScalAna" is braced so that sentence-casing styles
% do not turn it into "Scalana".
@article{DBLP:journals/corr/abs-2009-01692,
  author     = {Yuyang Jin and Haojie Wang and Teng Yu and Xiongchao Tang and Torsten Hoefler and Xu Liu and Jidong Zhai},
  title      = {{ScalAna}: Automating Scaling Loss Detection with Graph Analysis},
  journal    = {CoRR},
  volume     = {abs/2009.01692},
  year       = {2020},
  url        = {https://arxiv.org/abs/2009.01692},
  eprinttype = {arXiv},
  eprint     = {2009.01692},
  timestamp  = {Wed, 16 Sep 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2009-01692.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2009.06988, indexed by DBLP under CoRR.
% The mixed-case name "TardiS" is braced so that sentence-casing styles
% preserve its capitalisation.
@article{DBLP:journals/corr/abs-2009-06988,
  author     = {Maksym Planeta and Jan Bierbaum and Leo Sahaya Daphne Antony and Torsten Hoefler and Hermann H{\"{a}}rtig},
  title      = {{TardiS}: Migrating Containers with {RDMA} Networks},
  journal    = {CoRR},
  volume     = {abs/2009.06988},
  year       = {2020},
  url        = {https://arxiv.org/abs/2009.06988},
  eprinttype = {arXiv},
  eprint     = {2009.06988},
  timestamp  = {Fri, 18 Sep 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2009-06988.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2010.03536, indexed by DBLP under CoRR.
% The mixed-case name "PsPIN" is braced so that sentence-casing styles
% preserve its capitalisation.
@article{DBLP:journals/corr/abs-2010-03536,
  author     = {Salvatore Di Girolamo and Andreas Kurth and Alexandru Calotoiu and Thomas Benz and Timo Schneider and Jakub Ber{\'{a}}nek and Luca Benini and Torsten Hoefler},
  title      = {{PsPIN}: {A} high-performance low-power architecture for flexible in-network compute},
  journal    = {CoRR},
  volume     = {abs/2010.03536},
  year       = {2020},
  url        = {https://arxiv.org/abs/2010.03536},
  eprinttype = {arXiv},
  eprint     = {2010.03536},
  timestamp  = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2010-03536.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2010.05975, indexed by DBLP under CoRR.
@article{DBLP:journals/corr/abs-2010-05975,
  author     = {Grzegorz Kwasniewski and Tal Ben{-}Nun and Alexandros Nikolaos Ziogas and Timo Schneider and Maciej Besta and Torsten Hoefler},
  title      = {On the Parallel {I/O} Optimality of Linear Algebra Kernels: Near-Optimal {LU} Factorization},
  journal    = {CoRR},
  volume     = {abs/2010.05975},
  year       = {2020},
  url        = {https://arxiv.org/abs/2010.05975},
  eprinttype = {arXiv},
  eprint     = {2010.05975},
  timestamp  = {Tue, 20 Oct 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2010-05975.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2010.09025, indexed by DBLP under CoRR.
@article{DBLP:journals/corr/abs-2010-09025,
  author     = {Maciej Besta and Torsten Hoefler},
  title      = {Fault Tolerance for Remote Memory Access Programming Models},
  journal    = {CoRR},
  volume     = {abs/2010.09025},
  year       = {2020},
  url        = {https://arxiv.org/abs/2010.09025},
  eprinttype = {arXiv},
  eprint     = {2010.09025},
  timestamp  = {Wed, 21 Oct 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2010-09025.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2010.09135, indexed by DBLP under CoRR.
@article{DBLP:journals/corr/abs-2010-09135,
  author     = {Maciej Besta and Torsten Hoefler},
  title      = {Accelerating Irregular Computations with Hardware Transactional Memory and Active Messages},
  journal    = {CoRR},
  volume     = {abs/2010.09135},
  year       = {2020},
  url        = {https://arxiv.org/abs/2010.09135},
  eprinttype = {arXiv},
  eprint     = {2010.09135},
  timestamp  = {Wed, 21 Oct 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2010-09135.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2010.09852, indexed by DBLP under CoRR.
@article{DBLP:journals/corr/abs-2010-09852,
  author     = {Hermann Schweizer and Maciej Besta and Torsten Hoefler},
  title      = {Evaluating the Cost of Atomic Operations on Modern Architectures},
  journal    = {CoRR},
  volume     = {abs/2010.09852},
  year       = {2020},
  url        = {https://arxiv.org/abs/2010.09852},
  eprinttype = {arXiv},
  eprint     = {2010.09852},
  timestamp  = {Mon, 26 Oct 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2010-09852.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2010.09854, indexed by DBLP under CoRR.
@article{DBLP:journals/corr/abs-2010-09854,
  author     = {Patrick Schmid and Maciej Besta and Torsten Hoefler},
  title      = {High-Performance Distributed {RMA} Locks},
  journal    = {CoRR},
  volume     = {abs/2010.09854},
  year       = {2020},
  url        = {https://arxiv.org/abs/2010.09854},
  eprinttype = {arXiv},
  eprint     = {2010.09854},
  timestamp  = {Mon, 26 Oct 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2010-09854.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2010.09913, indexed by DBLP under CoRR.
% The camel-case name "SlimSell" is braced so that sentence-casing styles
% do not turn it into "Slimsell".
@article{DBLP:journals/corr/abs-2010-09913,
  author     = {Maciej Besta and Florian Marending and Edgar Solomonik and Torsten Hoefler},
  title      = {{SlimSell}: {A} Vectorizable Graph Representation for Breadth-First Search},
  journal    = {CoRR},
  volume     = {abs/2010.09913},
  year       = {2020},
  url        = {https://arxiv.org/abs/2010.09913},
  eprinttype = {arXiv},
  eprint     = {2010.09913},
  timestamp  = {Mon, 26 Oct 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2010-09913.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2010.10683, indexed by DBLP under CoRR.
% The mixed-case token "NoC" is braced so that sentence-casing styles
% do not lowercase it to "noc".
@article{DBLP:journals/corr/abs-2010-10683,
  author     = {Maciej Besta and Syed Minhaj Hassan and Sudhakar Yalamanchili and Rachata Ausavarungnirun and Onur Mutlu and Torsten Hoefler},
  title      = {Slim {NoC}: {A} Low-Diameter On-Chip Network Topology for High Energy Efficiency and Scalability},
  journal    = {CoRR},
  volume     = {abs/2010.10683},
  year       = {2020},
  url        = {https://arxiv.org/abs/2010.10683},
  eprinttype = {arXiv},
  eprint     = {2010.10683},
  timestamp  = {Mon, 26 Oct 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2010-10683.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2010.12478, indexed by DBLP under CoRR.
@article{DBLP:journals/corr/abs-2010-12478,
  author     = {Marcin Copik and Tobias Grosser and Torsten Hoefler and Paolo Bientinesi and Benjamin Berkels},
  title      = {Work-stealing prefix scan: Addressing load imbalance in large-scale image registration},
  journal    = {CoRR},
  volume     = {abs/2010.12478},
  year       = {2020},
  url        = {https://arxiv.org/abs/2010.12478},
  eprinttype = {arXiv},
  eprint     = {2010.12478},
  timestamp  = {Tue, 27 Oct 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2010-12478.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2010.14684, indexed by DBLP under CoRR.
@article{DBLP:journals/corr/abs-2010-14684,
  author     = {Maciej Besta and Marc Fischer and Tal Ben{-}Nun and Dimitri Stanojevic and Johannes de Fine Licht and Torsten Hoefler},
  title      = {Substream-Centric Maximum Matchings on {FPGA}},
  journal    = {CoRR},
  volume     = {abs/2010.14684},
  year       = {2020},
  url        = {https://arxiv.org/abs/2010.14684},
  eprinttype = {arXiv},
  eprint     = {2010.14684},
  timestamp  = {Mon, 02 Nov 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2010-14684.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2010.15218, indexed by DBLP under CoRR.
% The camel-case name "StencilFlow" is braced so that sentence-casing
% styles do not turn it into "Stencilflow".
@article{DBLP:journals/corr/abs-2010-15218,
  author     = {Johannes de Fine Licht and Andreas Kuster and Tiziano De Matteis and Tal Ben{-}Nun and Dominic Hofer and Torsten Hoefler},
  title      = {{StencilFlow}: Mapping Large Stencil Programs to Distributed Spatial Computing Systems},
  journal    = {CoRR},
  volume     = {abs/2010.15218},
  year       = {2020},
  url        = {https://arxiv.org/abs/2010.15218},
  eprinttype = {arXiv},
  eprint     = {2010.15218},
  timestamp  = {Tue, 03 Nov 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2010-15218.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2010.15879, indexed by DBLP under CoRR.
% The name "Log(Graph)" is braced as a unit so that sentence-casing
% styles do not lowercase the inner "Graph".
@article{DBLP:journals/corr/abs-2010-15879,
  author     = {Maciej Besta and Dimitri Stanojevic and Tijana Zivic and Jagpreet Singh and Maurice Hoerold and Torsten Hoefler},
  title      = {{Log(Graph)}: {A} Near-Optimal High-Performance Graph Representation},
  journal    = {CoRR},
  volume     = {abs/2010.15879},
  year       = {2020},
  url        = {https://arxiv.org/abs/2010.15879},
  eprinttype = {arXiv},
  eprint     = {2010.15879},
  timestamp  = {Tue, 03 Nov 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2010-15879.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2010.16012, indexed by DBLP under CoRR.
@article{DBLP:journals/corr/abs-2010-16012,
  author     = {Maciej Besta and Michal Podstawski and Linus Groner and Edgar Solomonik and Torsten Hoefler},
  title      = {To Push or To Pull: On Reducing Communication and Synchronization in Graph Computations},
  journal    = {CoRR},
  volume     = {abs/2010.16012},
  year       = {2020},
  url        = {https://arxiv.org/abs/2010.16012},
  eprinttype = {arXiv},
  eprint     = {2010.16012},
  timestamp  = {Tue, 03 Nov 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2010-16012.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2011.07001, indexed by DBLP under CoRR.
@article{DBLP:journals/corr/abs-2011-07001,
  author     = {Tal Ben{-}Nun and Lukas Gianinazzi and Torsten Hoefler and Yishai Oltchik},
  title      = {Parametric Graph Templates: Properties and Algorithms},
  journal    = {CoRR},
  volume     = {abs/2011.07001},
  year       = {2020},
  url        = {https://arxiv.org/abs/2011.07001},
  eprinttype = {arXiv},
  eprint     = {2011.07001},
  timestamp  = {Wed, 18 Nov 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2011-07001.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2011.08070, indexed by DBLP under CoRR.
@article{DBLP:journals/corr/abs-2011-08070,
  author     = {Paul Scheffler and Florian Zaruba and Fabian Schuiki and Torsten Hoefler and Luca Benini},
  title      = {Indirection Stream Semantic Register Architecture for Efficient Sparse-Dense Linear Algebra},
  journal    = {CoRR},
  volume     = {abs/2011.08070},
  year       = {2020},
  url        = {https://arxiv.org/abs/2011.08070},
  eprinttype = {arXiv},
  eprint     = {2011.08070},
  timestamp  = {Wed, 18 Nov 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2011-08070.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2012.01470, indexed by DBLP under CoRR.
@article{DBLP:journals/corr/abs-2012-01470,
  author     = {Chris Cummins and Hugh Leather and Zacharias V. Fisches and Tal Ben{-}Nun and Torsten Hoefler and Michael F. P. O'Boyle},
  title      = {Deep Data Flow Analysis},
  journal    = {CoRR},
  volume     = {abs/2012.01470},
  year       = {2020},
  url        = {https://arxiv.org/abs/2012.01470},
  eprinttype = {arXiv},
  eprint     = {2012.01470},
  timestamp  = {Fri, 04 Dec 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2012-01470.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2012.14132, indexed by DBLP under CoRR.
% The mixed-case name "SeBS" is braced so that sentence-casing styles
% do not turn it into "Sebs".
@article{DBLP:journals/corr/abs-2012-14132,
  author     = {Marcin Copik and Grzegorz Kwasniewski and Maciej Besta and Michal Podstawski and Torsten Hoefler},
  title      = {{SeBS}: {A} Serverless Benchmark Suite for Function-as-a-Service Computing},
  journal    = {CoRR},
  volume     = {abs/2012.14132},
  year       = {2020},
  url        = {https://arxiv.org/abs/2012.14132},
  eprinttype = {arXiv},
  eprint     = {2012.14132},
  timestamp  = {Tue, 05 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2012-14132.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2012.15592, indexed by DBLP under CoRR.
@article{DBLP:journals/corr/abs-2012-15592,
  author     = {Marcin Copik and Alexandru Calotoiu and Tobias Grosser and Nicolas Wicki and Felix Wolf and Torsten Hoefler},
  title      = {Extracting Clean Performance Models from Tainted Programs},
  journal    = {CoRR},
  volume     = {abs/2012.15592},
  year       = {2020},
  url        = {https://arxiv.org/abs/2012.15592},
  eprinttype = {arXiv},
  eprint     = {2012.15592},
  timestamp  = {Fri, 08 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2012-15592.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Journal article, Concurr. Comput. Pract. Exp. 31(2), 2019.
% The topology name "Slim Fly" is braced so that sentence-casing styles
% do not lowercase it.
% NOTE(review): the record carries no pages or article-number field;
% confirm against the publisher page before adding one.
@article{DBLP:journals/concurrency/YebenesEGQH19,
  author    = {Pedro Y{\'{e}}benes and Jes{\'{u}}s Escudero{-}Sahuquillo and Pedro Javier Garc{\'{\i}}a and Francisco J. Quiles and Torsten Hoefler},
  title     = {Head-of-line blocking avoidance in {Slim Fly} networks using deadlock-free non-minimal and adaptive routing},
  journal   = {Concurr. Comput. Pract. Exp.},
  volume    = {31},
  number    = {2},
  year      = {2019},
  url       = {https://doi.org/10.1002/cpe.4441},
  doi       = {10.1002/CPE.4441},
  timestamp = {Mon, 26 Oct 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/concurrency/YebenesEGQH19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Journal article, Comput. Sci. Eng. 21(1), 2019.
@article{DBLP:journals/cse/SchulthessBWFHS19,
  author    = {Thomas C. Schulthess and Peter Bauer and Nils Wedi and Oliver Fuhrer and Torsten Hoefler and Christoph M. Sch{\"{a}}r},
  title     = {Reflecting on the Goal and Baseline for Exascale Computing: {A} Roadmap Based on Weather and Climate Simulations},
  journal   = {Comput. Sci. Eng.},
  volume    = {21},
  number    = {1},
  pages     = {30--41},
  year      = {2019},
  url       = {https://doi.org/10.1109/MCSE.2018.2888788},
  doi       = {10.1109/MCSE.2018.2888788},
  timestamp = {Tue, 16 Aug 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/cse/SchulthessBWFHS19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Journal article, ACM Comput. Surv. 52(4), 2019.
@article{DBLP:journals/csur/Ben-NunH19,
  author    = {Tal Ben{-}Nun and Torsten Hoefler},
  title     = {Demystifying Parallel and Distributed Deep Learning: An In-depth Concurrency Analysis},
  journal   = {{ACM} Comput. Surv.},
  volume    = {52},
  number    = {4},
  pages     = {65:1--65:43},
  year      = {2019},
  url       = {https://doi.org/10.1145/3320060},
  doi       = {10.1145/3320060},
  timestamp = {Sat, 08 Jan 2022 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/csur/Ben-NunH19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Journal article, Proc. VLDB Endow. 12(13), 2019.
@article{DBLP:journals/pvldb/BarthelsMTAH19,
  author    = {Claude Barthels and Ingo M{\"{u}}ller and Konstantin Taranov and Gustavo Alonso and Torsten Hoefler},
  title     = {Strong consistency is not hard to get: Two-Phase Locking and Two-Phase Commit on Thousands of Cores},
  journal   = {Proc. {VLDB} Endow.},
  volume    = {12},
  number    = {13},
  pages     = {2325--2338},
  year      = {2019},
  url       = {http://www.vldb.org/pvldb/vol12/p2325-barthels.pdf},
  doi       = {10.14778/3358701.3358702},
  timestamp = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/pvldb/BarthelsMTAH19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Journal article, IEEE Trans. Parallel Distributed Syst. 30(8), 2019.
@article{DBLP:journals/tpds/ShudlerBCHSW19,
  author    = {Sergei Shudler and Yannick Berens and Alexandru Calotoiu and Torsten Hoefler and Alexandre Strube and Felix Wolf},
  title     = {Engineering Algorithms for Scalability through Continuous Validation of Performance Expectations},
  journal   = {{IEEE} Trans. Parallel Distributed Syst.},
  volume    = {30},
  number    = {8},
  pages     = {1768--1785},
  year      = {2019},
  url       = {https://doi.org/10.1109/TPDS.2019.2896993},
  doi       = {10.1109/TPDS.2019.2896993},
  timestamp = {Fri, 02 Oct 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/tpds/ShudlerBCHSW19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper, PACT 2019.
@inproceedings{DBLP:conf/IEEEpact/GysiGH19,
  author    = {Tobias Gysi and Tobias Grosser and Torsten Hoefler},
  title     = {Absinthe: Learning an Analytical Performance Model to Fuse and Tile Stencil Codes in One Shot},
  booktitle = {28th International Conference on Parallel Architectures and Compilation Techniques, {PACT} 2019, Seattle, WA, USA, September 23-26, 2019},
  pages     = {370--382},
  publisher = {{IEEE}},
  year      = {2019},
  url       = {https://doi.org/10.1109/PACT.2019.00036},
  doi       = {10.1109/PACT.2019.00036},
  timestamp = {Wed, 13 Nov 2019 18:02:12 +0100},
  biburl    = {https://dblp.org/rec/conf/IEEEpact/GysiGH19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper, DAC 2019.
@inproceedings{DBLP:conf/dac/GleinigHH19,
  author    = {Niels Gleinig and Frances Ann Hubis and Torsten Hoefler},
  title     = {Embedding Functions Into Reversible Circuits: {A} Probabilistic Approach to the Number of Lines},
  booktitle = {Proceedings of the 56th Annual Design Automation Conference 2019, {DAC} 2019, Las Vegas, NV, USA, June 02-06, 2019},
  pages     = {72},
  publisher = {{ACM}},
  year      = {2019},
  url       = {https://doi.org/10.1145/3316781.3317814},
  doi       = {10.1145/3316781.3317814},
  timestamp = {Sun, 08 Aug 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/dac/GleinigHH19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper, FPGA 2019.
@inproceedings{DBLP:conf/fpga/BestaFBLH19,
  author    = {Maciej Besta and Marc Fischer and Tal Ben{-}Nun and Johannes de Fine Licht and Torsten Hoefler},
  editor    = {Kia Bazargan and Stephen Neuendorffer},
  title     = {Substream-Centric Maximum Matchings on {FPGA}},
  booktitle = {Proceedings of the 2019 {ACM/SIGDA} International Symposium on Field-Programmable Gate Arrays, {FPGA} 2019, Seaside, CA, USA, February 24-26, 2019},
  pages     = {152--161},
  publisher = {{ACM}},
  year      = {2019},
  url       = {https://doi.org/10.1145/3289602.3293916},
  doi       = {10.1145/3289602.3293916},
  timestamp = {Sun, 25 Jul 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/fpga/BestaFBLH19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper, ICS 2019.
% "Krylov" is capitalised in the source title; it is braced so that
% sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/ics/EllerHG19,
  author    = {Paul R. Eller and Torsten Hoefler and William Gropp},
  editor    = {Rudolf Eigenmann and Chen Ding and Sally A. McKee},
  title     = {Using performance models to understand scalable {Krylov} solver performance at scale for structured grid problems},
  booktitle = {Proceedings of the {ACM} International Conference on Supercomputing, {ICS} 2019, Phoenix, AZ, USA, June 26-28, 2019},
  pages     = {138--149},
  publisher = {{ACM}},
  year      = {2019},
  url       = {https://doi.org/10.1145/3330345.3330358},
  doi       = {10.1145/3330345.3330358},
  timestamp = {Tue, 28 Jul 2020 07:46:43 +0200},
  biburl    = {https://dblp.org/rec/conf/ics/EllerHG19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper, IPDPS 2019.
@inproceedings{DBLP:conf/ipps/Ben-NunBHZPH19,
  author    = {Tal Ben{-}Nun and Maciej Besta and Simon Huber and Alexandros Nikolaos Ziogas and Daniel Peter and Torsten Hoefler},
  title     = {A Modular Benchmarking Infrastructure for High-Performance and Reproducible Deep Learning},
  booktitle = {2019 {IEEE} International Parallel and Distributed Processing Symposium, {IPDPS} 2019, Rio de Janeiro, Brazil, May 20-24, 2019},
  pages     = {66--77},
  publisher = {{IEEE}},
  year      = {2019},
  url       = {https://doi.org/10.1109/IPDPS.2019.00018},
  doi       = {10.1109/IPDPS.2019.00018},
  timestamp = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl    = {https://dblp.org/rec/conf/ipps/Ben-NunBHZPH19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Invited-talk record in the IPDPSW 2019 workshop proceedings.
@inproceedings{DBLP:conf/ipps/Hoefler19,
  author    = {Torsten Hoefler},
  title     = {Invited Talk 2},
  booktitle = {{IEEE} International Parallel and Distributed Processing Symposium Workshops, {IPDPSW} 2019, Rio de Janeiro, Brazil, May 20-24, 2019},
  pages     = {392},
  publisher = {{IEEE}},
  year      = {2019},
  url       = {https://doi.org/10.1109/IPDPSW.2019.00074},
  doi       = {10.1109/IPDPSW.2019.00074},
  timestamp = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl    = {https://dblp.org/rec/conf/ipps/Hoefler19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper, IPDPS 2019.
% The mixed-case name "SimFS" is braced so that sentence-casing styles
% do not turn it into "Simfs".
@inproceedings{DBLP:conf/ipps/GirolamoSSH19,
  author    = {Salvatore Di Girolamo and Pirmin Schmid and Thomas C. Schulthess and Torsten Hoefler},
  title     = {{SimFS}: {A} Simulation Data Virtualizing File System Interface},
  booktitle = {2019 {IEEE} International Parallel and Distributed Processing Symposium, {IPDPS} 2019, Rio de Janeiro, Brazil, May 20-24, 2019},
  pages     = {621--630},
  publisher = {{IEEE}},
  year      = {2019},
  url       = {https://doi.org/10.1109/IPDPS.2019.00071},
  doi       = {10.1109/IPDPS.2019.00071},
  timestamp = {Mon, 09 Sep 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/ipps/GirolamoSSH19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper, PASC 2019.
% "CPUs" is braced, like the already-protected COSMO, so that
% sentence-casing styles do not render it as "cpus".
@inproceedings{DBLP:conf/pasc/ThalerMOBVAMFSH19,
  author    = {Felix Thaler and Stefan Moosbrugger and Carlos Osuna and Mauro Bianco and Hannes Vogt and Anton Afanasyev and Lukas Mosimann and Oliver Fuhrer and Thomas C. Schulthess and Torsten Hoefler},
  title     = {Porting the {COSMO} Weather Model to Manycore {CPUs}},
  booktitle = {Proceedings of the Platform for Advanced Scientific Computing Conference, {PASC} 2019, Zurich, Switzerland, June 12-14, 2019},
  pages     = {13:1--13:11},
  publisher = {{ACM}},
  year      = {2019},
  url       = {https://doi.org/10.1145/3324989.3325723},
  doi       = {10.1145/3324989.3325723},
  timestamp = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/pasc/ThalerMOBVAMFSH19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper, PLDI 2019.
@inproceedings{DBLP:conf/pldi/GysiGBH19,
  author    = {Tobias Gysi and Tobias Grosser and Laurin Brandner and Torsten Hoefler},
  editor    = {Kathryn S. McKinley and Kathleen Fisher},
  title     = {A fast analytical model of fully associative caches},
  booktitle = {Proceedings of the 40th {ACM} {SIGPLAN} Conference on Programming Language Design and Implementation, {PLDI} 2019, Phoenix, AZ, USA, June 22-26, 2019},
  pages     = {816--829},
  publisher = {{ACM}},
  year      = {2019},
  url       = {https://doi.org/10.1145/3314221.3314606},
  doi       = {10.1145/3314221.3314606},
  timestamp = {Sun, 09 Jun 2019 18:52:19 +0200},
  biburl    = {https://dblp.org/rec/conf/pldi/GysiGBH19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper, PPoPP 2019.
@inproceedings{DBLP:conf/ppopp/KuttlerPBWHBH19,
  author    = {Martin K{\"{u}}ttler and Maksym Planeta and Jan Bierbaum and Carsten Weinhold and Hermann H{\"{a}}rtig and Amnon Barak and Torsten Hoefler},
  editor    = {Jeffrey K. Hollingsworth and Idit Keidar},
  title     = {Corrected trees for reliable group communication},
  booktitle = {Proceedings of the 24th {ACM} {SIGPLAN} Symposium on Principles and Practice of Parallel Programming, PPoPP 2019, Washington, DC, USA, February 16-20, 2019},
  pages     = {287--299},
  publisher = {{ACM}},
  year      = {2019},
  url       = {https://doi.org/10.1145/3293883.3295721},
  doi       = {10.1145/3293883.3295721},
  timestamp = {Sun, 12 Jun 2022 19:46:08 +0200},
  biburl    = {https://dblp.org/rec/conf/ppopp/KuttlerPBWHBH19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Foreword of the EuroMPI 2019 proceedings.
% The camel-case name "EuroMPI" is braced in the title so that
% sentence-casing styles do not turn it into "eurompi".
@inproceedings{DBLP:conf/pvm/TraffH19,
  author    = {Jesper Larsson Tr{\"{a}}ff and Torsten Hoefler},
  editor    = {Torsten Hoefler and Jesper Larsson Tr{\"{a}}ff},
  title     = {Foreword {EuroMPI} 2019},
  booktitle = {Proceedings of the 26th European {MPI} Users' Group Meeting, EuroMPI 2019, Z{\"{u}}rich, Switzerland, September 11-13, 2019},
  pages     = {1:1--1:2},
  publisher = {{ACM}},
  year      = {2019},
  url       = {https://doi.org/10.1145/3343211.3343212},
  doi       = {10.1145/3343211.3343212},
  timestamp = {Wed, 11 Sep 2019 12:26:40 +0200},
  biburl    = {https://dblp.org/rec/conf/pvm/TraffH19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper, SC 2019.
@inproceedings{DBLP:conf/sc/ZiogasBFSLH19,
  author    = {Alexandros Nikolaos Ziogas and Tal Ben{-}Nun and Guillermo Indalecio Fern{\'{a}}ndez and Timo Schneider and Mathieu Luisier and Torsten Hoefler},
  editor    = {Michela Taufer and Pavan Balaji and Antonio J. Pe{\~{n}}a},
  title     = {A data-centric approach to extreme-scale \emph{ab initio} dissipative quantum transport simulations},
  booktitle = {Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis, {SC} 2019, Denver, Colorado, USA, November 17-19, 2019},
  pages     = {1:1--1:13},
  publisher = {{ACM}},
  year      = {2019},
  url       = {https://doi.org/10.1145/3295500.3357156},
  doi       = {10.1145/3295500.3357156},
  timestamp = {Wed, 07 Dec 2022 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/sc/ZiogasBFSLH19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper, SC 2019.
% The mixed-case name "SparCML" is braced so that sentence-casing styles
% do not turn it into "Sparcml".
@inproceedings{DBLP:conf/sc/RenggliAAAH19,
  author    = {C{\'{e}}dric Renggli and Saleh Ashkboos and Mehdi Aghagolzadeh and Dan Alistarh and Torsten Hoefler},
  editor    = {Michela Taufer and Pavan Balaji and Antonio J. Pe{\~{n}}a},
  title     = {{SparCML}: high-performance sparse communication for machine learning},
  booktitle = {Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis, {SC} 2019, Denver, Colorado, USA, November 17-19, 2019},
  pages     = {11:1--11:15},
  publisher = {{ACM}},
  year      = {2019},
  url       = {https://doi.org/10.1145/3295500.3356222},
  doi       = {10.1145/3295500.3356222},
  timestamp = {Sat, 09 Nov 2019 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/sc/RenggliAAAH19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper, SC 2019.
% "Dragonfly" is capitalised in the source title; it is braced so that
% sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/sc/SensiGH19,
  author    = {Daniele De Sensi and Salvatore Di Girolamo and Torsten Hoefler},
  editor    = {Michela Taufer and Pavan Balaji and Antonio J. Pe{\~{n}}a},
  title     = {Mitigating network noise on {Dragonfly} networks through application-aware routing},
  booktitle = {Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis, {SC} 2019, Denver, Colorado, USA, November 17-19, 2019},
  pages     = {16:1--16:32},
  publisher = {{ACM}},
  year      = {2019},
  url       = {https://doi.org/10.1145/3295500.3356196},
  doi       = {10.1145/3295500.3356196},
  timestamp = {Sat, 09 Nov 2019 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/sc/SensiGH19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper, SC 2019.
@inproceedings{DBLP:conf/sc/KwasniewskiKBVS19,
  author    = {Grzegorz Kwasniewski and Marko Kabic and Maciej Besta and Joost VandeVondele and Raffaele Solc{\`{a}} and Torsten Hoefler},
  editor    = {Michela Taufer and Pavan Balaji and Antonio J. Pe{\~{n}}a},
  title     = {Red-blue pebbling revisited: near optimal parallel matrix-matrix multiplication},
  booktitle = {Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis, {SC} 2019, Denver, Colorado, USA, November 17-19, 2019},
  pages     = {24:1--24:22},
  publisher = {{ACM}},
  year      = {2019},
  url       = {https://doi.org/10.1145/3295500.3356181},
  doi       = {10.1145/3295500.3356181},
  timestamp = {Sun, 06 Aug 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/sc/KwasniewskiKBVS19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper, SC 2019.
@inproceedings{DBLP:conf/sc/BestaWGGIOH19,
  author    = {Maciej Besta and Simon Weber and Lukas Gianinazzi and Robert Gerstenberger and Andrey Ivanov and Yishai Oltchik and Torsten Hoefler},
  editor    = {Michela Taufer and Pavan Balaji and Antonio J. Pe{\~{n}}a},
  title     = {Slim graph: practical lossy graph compression for approximate graph processing, storage, and analytics},
  booktitle = {Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis, {SC} 2019, Denver, Colorado, USA, November 17-19, 2019},
  pages     = {35:1--35:25},
  publisher = {{ACM}},
  year      = {2019},
  url       = {https://doi.org/10.1145/3295500.3356182},
  doi       = {10.1145/3295500.3356182},
  timestamp = {Wed, 10 May 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/sc/BestaWGGIOH19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper, SC 2019.
@inproceedings{DBLP:conf/sc/GirolamoTKSSBBB19,
  author    = {Salvatore Di Girolamo and Konstantin Taranov and Andreas Kurth and Michael Schaffner and Timo Schneider and Jakub Ber{\'{a}}nek and Maciej Besta and Luca Benini and Duncan Roweth and Torsten Hoefler},
  editor    = {Michela Taufer and Pavan Balaji and Antonio J. Pe{\~{n}}a},
  title     = {Network-accelerated non-contiguous memory transfers},
  booktitle = {Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis, {SC} 2019, Denver, Colorado, USA, November 17-19, 2019},
  pages     = {56:1--56:14},
  publisher = {{ACM}},
  year      = {2019},
  url       = {https://doi.org/10.1145/3295500.3356189},
  doi       = {10.1145/3295500.3356189},
  timestamp = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/sc/GirolamoTKSSBBB19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper, SC 2019.
@inproceedings{DBLP:conf/sc/ZiogasBFSLH19a,
  author    = {Alexandros Nikolaos Ziogas and Tal Ben{-}Nun and Guillermo Indalecio Fern{\'{a}}ndez and Timo Schneider and Mathieu Luisier and Torsten Hoefler},
  editor    = {Michela Taufer and Pavan Balaji and Antonio J. Pe{\~{n}}a},
  title     = {Optimizing the data movement in quantum transport simulations via data-centric parallel programming},
  booktitle = {Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis, {SC} 2019, Denver, Colorado, USA, November 17-19, 2019},
  pages     = {78:1--78:17},
  publisher = {{ACM}},
  year      = {2019},
  url       = {https://doi.org/10.1145/3295500.3356200},
  doi       = {10.1145/3295500.3356200},
  timestamp = {Sat, 09 Nov 2019 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/sc/ZiogasBFSLH19a.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper, SC 2019.
@inproceedings{DBLP:conf/sc/Ben-NunLZSH19,
  author    = {Tal Ben{-}Nun and Johannes de Fine Licht and Alexandros Nikolaos Ziogas and Timo Schneider and Torsten Hoefler},
  editor    = {Michela Taufer and Pavan Balaji and Antonio J. Pe{\~{n}}a},
  title     = {Stateful dataflow multigraphs: a data-centric model for performance portability on heterogeneous architectures},
  booktitle = {Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis, {SC} 2019, Denver, Colorado, USA, November 17-19, 2019},
  pages     = {81:1--81:14},
  publisher = {{ACM}},
  year      = {2019},
  url       = {https://doi.org/10.1145/3295500.3356173},
  doi       = {10.1145/3295500.3356173},
  timestamp = {Sun, 25 Jul 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/sc/Ben-NunLZSH19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper, SC 2019.
@inproceedings{DBLP:conf/sc/MatteisLBH19,
  author    = {Tiziano De Matteis and Johannes de Fine Licht and Jakub Ber{\'{a}}nek and Torsten Hoefler},
  editor    = {Michela Taufer and Pavan Balaji and Antonio J. Pe{\~{n}}a},
  title     = {Streaming message interface: high-performance distributed memory programming on reconfigurable hardware},
  booktitle = {Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis, {SC} 2019, Denver, Colorado, USA, November 17-19, 2019},
  pages     = {82:1--82:33},
  publisher = {{ACM}},
  year      = {2019},
  url       = {https://doi.org/10.1145/3295500.3356201},
  doi       = {10.1145/3295500.3356201},
  timestamp = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/sc/MatteisLBH19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Whole-proceedings record for EuroMPI 2019 (edited volume, ACM).
@proceedings{DBLP:conf/pvm/2019,
  editor    = {Torsten Hoefler and Jesper Larsson Tr{\"{a}}ff},
  title     = {Proceedings of the 26th European {MPI} Users' Group Meeting, EuroMPI 2019, Z{\"{u}}rich, Switzerland, September 11-13, 2019},
  publisher = {{ACM}},
  year      = {2019},
  url       = {https://doi.org/10.1145/3343211},
  doi       = {10.1145/3343211},
  isbn      = {978-1-4503-7175-9},
  timestamp = {Wed, 11 Sep 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/pvm/2019.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1901.09335, indexed by DBLP under CoRR.
% The url uses https, matching the 2020 arXiv records in this file.
@article{DBLP:journals/corr/abs-1901-09335,
  author     = {Elad Hoffer and Tal Ben{-}Nun and Itay Hubara and Niv Giladi and Torsten Hoefler and Daniel Soudry},
  title      = {Augment your batch: better training with larger batches},
  journal    = {CoRR},
  volume     = {abs/1901.09335},
  year       = {2019},
  url        = {https://arxiv.org/abs/1901.09335},
  eprinttype = {arXiv},
  eprint     = {1901.09335},
  timestamp  = {Sat, 02 Feb 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1901-09335.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1901.10183, indexed by DBLP under CoRR.
% The url uses https, matching the 2020 arXiv records in this file.
@article{DBLP:journals/corr/abs-1901-10183,
  author     = {Tal Ben{-}Nun and Maciej Besta and Simon Huber and Alexandros Nikolaos Ziogas and Daniel Peter and Torsten Hoefler},
  title      = {A Modular Benchmarking Infrastructure for High-Performance and Reproducible Deep Learning},
  journal    = {CoRR},
  volume     = {abs/1901.10183},
  year       = {2019},
  url        = {https://arxiv.org/abs/1901.10183},
  eprinttype = {arXiv},
  eprint     = {1901.10183},
  timestamp  = {Sat, 02 Feb 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1901-10183.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1902.03154, indexed by DBLP under CoRR.
% The url uses https, matching the 2020 arXiv records in this file.
% The mixed-case name "SimFS" is braced so that sentence-casing styles
% do not turn it into "Simfs".
@article{DBLP:journals/corr/abs-1902-03154,
  author     = {Salvatore Di Girolamo and Pirmin Schmid and Thomas C. Schulthess and Torsten Hoefler},
  title      = {{SimFS}: {A} Simulation Data Virtualizing File System Interface},
  journal    = {CoRR},
  volume     = {abs/1902.03154},
  year       = {2019},
  url        = {https://arxiv.org/abs/1902.03154},
  eprinttype = {arXiv},
  eprint     = {1902.03154},
  timestamp  = {Tue, 21 May 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1902-03154.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1902.10345, indexed by DBLP under CoRR.
% The url uses https, matching the 2020 arXiv records in this file.
@article{DBLP:journals/corr/abs-1902-10345,
  author     = {Tal Ben{-}Nun and Johannes de Fine Licht and Alexandros Nikolaos Ziogas and Timo Schneider and Torsten Hoefler},
  title      = {Stateful Dataflow Multigraphs: {A} Data-Centric Model for High-Performance Parallel Programs},
  journal    = {CoRR},
  volume     = {abs/1902.10345},
  year       = {2019},
  url        = {https://arxiv.org/abs/1902.10345},
  eprinttype = {arXiv},
  eprint     = {1902.10345},
  timestamp  = {Tue, 21 May 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1902-10345.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/1903.06697), 2019.
% The acronym FPGAs is brace-protected so sentence-casing styles do not lowercase it.
@article{DBLP:journals/corr/abs-1903-06697,
  author     = {Maciej Besta and Dimitri Stanojevic and Johannes de Fine Licht and Tal Ben{-}Nun and Torsten Hoefler},
  title      = {Graph Processing on {FPGAs}: Taxonomy, Survey, Challenges},
  journal    = {CoRR},
  volume     = {abs/1903.06697},
  year       = {2019},
  url        = {http://arxiv.org/abs/1903.06697},
  eprinttype = {arXiv},
  eprint     = {1903.06697},
  timestamp  = {Mon, 01 Apr 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1903-06697.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1906.10885), 2019.
% The name FatPaths is brace-protected so sentence-casing styles keep its inner capital.
@article{DBLP:journals/corr/abs-1906-10885,
  author     = {Maciej Besta and Marcel Schneider and Karolina Cynk and Marek Konieczny and Erik Henriksson and Salvatore Di Girolamo and Ankit Singla and Torsten Hoefler},
  title      = {{FatPaths}: Routing in Supercomputers, Data Centers, and Clouds with Low-Diameter Networks when Shortest Paths Fall Short},
  journal    = {CoRR},
  volume     = {abs/1906.10885},
  year       = {2019},
  url        = {http://arxiv.org/abs/1906.10885},
  eprinttype = {arXiv},
  eprint     = {1906.10885},
  timestamp  = {Thu, 27 Jun 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1906-10885.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1907.07929), 2019.
@article{DBLP:journals/corr/abs-1907-07929,
  author     = {Tiziano De Matteis and Johannes de Fine Licht and Torsten Hoefler},
  title      = {{FBLAS:} Streaming Linear Algebra on {FPGA}},
  journal    = {CoRR},
  volume     = {abs/1907.07929},
  year       = {2019},
  url        = {http://arxiv.org/abs/1907.07929},
  eprinttype = {arXiv},
  eprint     = {1907.07929},
  timestamp  = {Tue, 23 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1907-07929.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1908.04207), 2019.
@article{DBLP:journals/corr/abs-1908-04207,
  author     = {Shigang Li and Tal Ben{-}Nun and Salvatore Di Girolamo and Dan Alistarh and Torsten Hoefler},
  title      = {Taming Unbalanced Training Workloads in Deep Learning with Partial Collective Operations},
  journal    = {CoRR},
  volume     = {abs/1908.04207},
  year       = {2019},
  url        = {http://arxiv.org/abs/1908.04207},
  eprinttype = {arXiv},
  eprint     = {1908.04207},
  timestamp  = {Mon, 19 Aug 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1908-04207.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1908.08590), 2019.
@article{DBLP:journals/corr/abs-1908-08590,
  author     = {Salvatore Di Girolamo and Konstantin Taranov and Andreas Kurth and Michael Schaffner and Timo Schneider and Jakub Ber{\'{a}}nek and Maciej Besta and Luca Benini and Duncan Roweth and Torsten Hoefler},
  title      = {Network-Accelerated Non-Contiguous Memory Transfers},
  journal    = {CoRR},
  volume     = {abs/1908.08590},
  year       = {2019},
  url        = {http://arxiv.org/abs/1908.08590},
  eprinttype = {arXiv},
  eprint     = {1908.08590},
  timestamp  = {Mon, 26 Aug 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1908-08590.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1908.08986), 2019.
@article{DBLP:journals/corr/abs-1908-08986,
  author     = {Elad Hoffer and Berry Weinstein and Itay Hubara and Tal Ben{-}Nun and Torsten Hoefler and Daniel Soudry},
  title      = {Mix {\&} Match: training convnets with mixed image sizes for improved accuracy, speed and scale resiliency},
  journal    = {CoRR},
  volume     = {abs/1908.08986},
  year       = {2019},
  url        = {http://arxiv.org/abs/1908.08986},
  eprinttype = {arXiv},
  eprint     = {1908.08986},
  timestamp  = {Thu, 29 Aug 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1908-08986.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1908.09606), 2019.
@article{DBLP:journals/corr/abs-1908-09606,
  author     = {Grzegorz Kwasniewski and Marko Kabic and Maciej Besta and Joost VandeVondele and Raffaele Solc{\`{a}} and Torsten Hoefler},
  title      = {Red-blue pebbling revisited: near optimal parallel matrix-matrix multiplication},
  journal    = {CoRR},
  volume     = {abs/1908.09606},
  year       = {2019},
  url        = {http://arxiv.org/abs/1908.09606},
  eprinttype = {arXiv},
  eprint     = {1908.09606},
  timestamp  = {Thu, 29 Aug 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1908-09606.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1909.03231), 2019.
@article{DBLP:journals/corr/abs-1909-03231,
  author     = {Tiziano De Matteis and Johannes de Fine Licht and Jakub Ber{\'{a}}nek and Torsten Hoefler},
  title      = {Streaming Message Interface: High-Performance Distributed Memory Programming on Reconfigurable Hardware},
  journal    = {CoRR},
  volume     = {abs/1909.03231},
  year       = {2019},
  url        = {http://arxiv.org/abs/1909.03231},
  eprinttype = {arXiv},
  eprint     = {1909.03231},
  timestamp  = {Tue, 17 Sep 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1909-03231.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1909.07865), 2019.
@article{DBLP:journals/corr/abs-1909-07865,
  author     = {Daniele De Sensi and Salvatore Di Girolamo and Torsten Hoefler},
  title      = {Mitigating Network Noise on Dragonfly Networks through Application-Aware Routing},
  journal    = {CoRR},
  volume     = {abs/1909.07865},
  year       = {2019},
  url        = {http://arxiv.org/abs/1909.07865},
  eprinttype = {arXiv},
  eprint     = {1909.07865},
  timestamp  = {Tue, 24 Sep 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1909-07865.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1910.04436), 2019.
@article{DBLP:journals/corr/abs-1910-04436,
  author     = {Johannes de Fine Licht and Torsten Hoefler},
  title      = {hlslib: Software Engineering for Hardware Design},
  journal    = {CoRR},
  volume     = {abs/1910.04436},
  year       = {2019},
  url        = {http://arxiv.org/abs/1910.04436},
  eprinttype = {arXiv},
  eprint     = {1910.04436},
  timestamp  = {Wed, 16 Oct 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1910-04436.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1910.09017), 2019.
@article{DBLP:journals/corr/abs-1910-09017,
  author     = {Maciej Besta and Emanuel Peter and Robert Gerstenberger and Marc Fischer and Michal Podstawski and Claude Barthels and Gustavo Alonso and Torsten Hoefler},
  title      = {Demystifying Graph Databases: Analysis and Taxonomy of Data Organization, System Designs, and Graph Queries},
  journal    = {CoRR},
  volume     = {abs/1910.09017},
  year       = {2019},
  url        = {http://arxiv.org/abs/1910.09017},
  eprinttype = {arXiv},
  eprint     = {1910.09017},
  timestamp  = {Tue, 22 Oct 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1910-09017.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1910.12897), 2019.
@article{DBLP:journals/corr/abs-1910-12897,
  author     = {Maciej Besta and Torsten Hoefler},
  title      = {Active Access: {A} Mechanism for High-Performance Distributed Data-Centric Computations},
  journal    = {CoRR},
  volume     = {abs/1910.12897},
  year       = {2019},
  url        = {http://arxiv.org/abs/1910.12897},
  eprinttype = {arXiv},
  eprint     = {1910.12897},
  timestamp  = {Thu, 31 Oct 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1910-12897.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1911.00630), 2019.
@article{DBLP:journals/corr/abs-1911-00630,
  author     = {Peter Gr{\"{o}}nquist and Tal Ben{-}Nun and Nikoli Dryden and Peter Dueben and Luca Lavarini and Shigang Li and Torsten Hoefler},
  title      = {Predicting Weather Uncertainty with Deep Convnets},
  journal    = {CoRR},
  volume     = {abs/1911.00630},
  year       = {2019},
  url        = {http://arxiv.org/abs/1911.00630},
  eprinttype = {arXiv},
  eprint     = {1911.00630},
  timestamp  = {Mon, 11 Nov 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1911-00630.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1911.04200), 2019.
% The proper noun Jaccard is brace-protected so sentence-casing styles do not lowercase it.
@article{DBLP:journals/corr/abs-1911-04200,
  author     = {Maciej Besta and Raghavendra Kanakagiri and Harun Mustafa and Mikhail Karasikov and Gunnar R{\"{a}}tsch and Torsten Hoefler and Edgar Solomonik},
  title      = {Communication-Efficient {Jaccard} Similarity for High-Performance Distributed Genome Comparisons},
  journal    = {CoRR},
  volume     = {abs/1911.04200},
  year       = {2019},
  url        = {http://arxiv.org/abs/1911.04200},
  eprinttype = {arXiv},
  eprint     = {1911.04200},
  timestamp  = {Sun, 01 Dec 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1911-04200.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1911.08356), 2019.
@article{DBLP:journals/corr/abs-1911-08356,
  author     = {Fabian Schuiki and Florian Zaruba and Torsten Hoefler and Luca Benini},
  title      = {Stream Semantic Registers: {A} Lightweight {RISC-V} {ISA} Extension Achieving Full Compute Utilization in Single-Issue Cores},
  journal    = {CoRR},
  volume     = {abs/1911.08356},
  year       = {2019},
  url        = {http://arxiv.org/abs/1911.08356},
  eprinttype = {arXiv},
  eprint     = {1911.08356},
  timestamp  = {Mon, 02 Dec 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1911-08356.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1912.06526), 2019.
@article{DBLP:journals/corr/abs-1912-06526,
  author     = {Johannes de Fine Licht and Grzegorz Kwasniewski and Torsten Hoefler},
  title      = {Flexible Communication Avoiding Matrix Multiplication on {FPGA} with High-Level Synthesis},
  journal    = {CoRR},
  volume     = {abs/1912.06526},
  year       = {2019},
  url        = {http://arxiv.org/abs/1912.06526},
  eprinttype = {arXiv},
  eprint     = {1912.06526},
  timestamp  = {Thu, 02 Jan 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1912-06526.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1912.08810), 2019.
@article{DBLP:journals/corr/abs-1912-08810,
  author     = {Alexandros Nikolaos Ziogas and Tal Ben{-}Nun and Guillermo Indalecio Fern{\'{a}}ndez and Timo Schneider and Mathieu Luisier and Torsten Hoefler},
  title      = {Optimizing the Data Movement in Quantum Transport Simulations via Data-Centric Parallel Programming},
  journal    = {CoRR},
  volume     = {abs/1912.08810},
  year       = {2019},
  url        = {http://arxiv.org/abs/1912.08810},
  eprinttype = {arXiv},
  eprint     = {1912.08810},
  timestamp  = {Fri, 03 Jan 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1912-08810.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1912.08950), 2019.
% The system name Slim Graph is brace-protected so sentence-casing styles keep both capitals.
@article{DBLP:journals/corr/abs-1912-08950,
  author     = {Maciej Besta and Simon Weber and Lukas Gianinazzi and Robert Gerstenberger and Andrey Ivanov and Yishai Oltchik and Torsten Hoefler},
  title      = {{Slim Graph}: Practical Lossy Graph Compression for Approximate Graph Processing, Storage, and Analytics},
  journal    = {CoRR},
  volume     = {abs/1912.08950},
  year       = {2019},
  url        = {http://arxiv.org/abs/1912.08950},
  eprinttype = {arXiv},
  eprint     = {1912.08950},
  timestamp  = {Wed, 10 May 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1912-08950.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1912.08968), 2019.
% The topology name Slim Fly is brace-protected so sentence-casing styles keep both capitals.
@article{DBLP:journals/corr/abs-1912-08968,
  author     = {Maciej Besta and Torsten Hoefler},
  title      = {{Slim Fly}: {A} Cost Effective Low-Diameter Network Topology},
  journal    = {CoRR},
  volume     = {abs/1912.08968},
  year       = {2019},
  url        = {http://arxiv.org/abs/1912.08968},
  eprinttype = {arXiv},
  eprint     = {1912.08968},
  timestamp  = {Fri, 03 Jan 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1912-08968.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1912.10024), 2019.
@article{DBLP:journals/corr/abs-1912-10024,
  author     = {Alexandros Nikolaos Ziogas and Tal Ben{-}Nun and Guillermo Indalecio Fern{\'{a}}ndez and Timo Schneider and Mathieu Luisier and Torsten Hoefler},
  title      = {A Data-Centric Approach to Extreme-Scale Ab initio Dissipative Quantum Transport Simulations},
  journal    = {CoRR},
  volume     = {abs/1912.10024},
  year       = {2019},
  url        = {http://arxiv.org/abs/1912.10024},
  eprinttype = {arXiv},
  eprint     = {1912.10024},
  timestamp  = {Fri, 03 Jan 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1912-10024.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1912.12740), 2019.
@article{DBLP:journals/corr/abs-1912-12740,
  author     = {Maciej Besta and Marc Fischer and Vasiliki Kalavri and Michael Kapralov and Torsten Hoefler},
  title      = {Practice of Streaming and Dynamic Graphs: Concepts, Models, Systems, and Parallelism},
  journal    = {CoRR},
  volume     = {abs/1912.12740},
  year       = {2019},
  url        = {http://arxiv.org/abs/1912.12740},
  eprinttype = {arXiv},
  eprint     = {1912.12740},
  timestamp  = {Sat, 04 Jan 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1912-12740.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: Commun. ACM 61(10), 2018.
@article{DBLP:journals/cacm/GerstenbergerBH18,
  author     = {Robert Gerstenberger and Maciej Besta and Torsten Hoefler},
  title      = {Enabling highly scalable remote memory access programming with {MPI-3} one sided},
  journal    = {Commun. {ACM}},
  volume     = {61},
  number     = {10},
  pages      = {106--113},
  year       = {2018},
  url        = {https://doi.org/10.1145/3264413},
  doi        = {10.1145/3264413},
  timestamp  = {Wed, 21 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/cacm/GerstenbergerBH18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: IEEE Trans. Parallel Distributed Syst. 29(3), 2018.
% The proper noun Morton is brace-protected so sentence-casing styles do not lowercase it.
@article{DBLP:journals/tpds/LiZH18,
  author     = {Shigang Li and Yunquan Zhang and Torsten Hoefler},
  title      = {Cache-Oblivious {MPI} All-to-All Communications Based on {Morton} Order},
  journal    = {{IEEE} Trans. Parallel Distributed Syst.},
  volume     = {29},
  number     = {3},
  pages      = {542--555},
  year       = {2018},
  url        = {https://doi.org/10.1109/TPDS.2017.2768413},
  doi        = {10.1109/TPDS.2017.2768413},
  timestamp  = {Fri, 02 Oct 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/tpds/LiZH18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: PACT 2018.
@inproceedings{DBLP:conf/IEEEpact/BestaSZSHH18,
  author     = {Maciej Besta and Dimitri Stanojevic and Tijana Zivic and Jagpreet Singh and Maurice Hoerold and Torsten Hoefler},
  editor     = {Skevos Evripidou and Per Stenstr{\"{o}}m and Michael F. P. O'Boyle},
  title      = {Log(graph): a near-optimal high-performance graph representation},
  booktitle  = {Proceedings of the 27th International Conference on Parallel Architectures and Compilation Techniques, {PACT} 2018, Limassol, Cyprus, November 01-04, 2018},
  pages      = {7:1--7:13},
  publisher  = {{ACM}},
  year       = {2018},
  url        = {https://doi.org/10.1145/3243176.3243198},
  doi        = {10.1145/3243176.3243198},
  timestamp  = {Wed, 21 Nov 2018 12:44:10 +0100},
  biburl     = {https://dblp.org/rec/conf/IEEEpact/BestaSZSHH18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: ASPLOS 2018.
% The name Slim NoC is brace-protected so sentence-casing styles do not turn NoC into "noc".
@inproceedings{DBLP:conf/asplos/BestaHYAMH18,
  author     = {Maciej Besta and Syed Minhaj Hassan and Sudhakar Yalamanchili and Rachata Ausavarungnirun and Onur Mutlu and Torsten Hoefler},
  editor     = {Xipeng Shen and James Tuck and Ricardo Bianchini and Vivek Sarkar},
  title      = {{Slim NoC}: {A} Low-Diameter On-Chip Network Topology for High Energy Efficiency and Scalability},
  booktitle  = {Proceedings of the Twenty-Third International Conference on Architectural Support for Programming Languages and Operating Systems, {ASPLOS} 2018, Williamsburg, VA, USA, March 24-28, 2018},
  pages      = {43--55},
  publisher  = {{ACM}},
  year       = {2018},
  url        = {https://doi.org/10.1145/3173162.3177158},
  doi        = {10.1145/3173162.3177158},
  timestamp  = {Tue, 23 Jan 2024 20:31:22 +0100},
  biburl     = {https://dblp.org/rec/conf/asplos/BestaHYAMH18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: IEEE CLUSTER 2018.
@inproceedings{DBLP:conf/cluster/CalotoiuGHLR018,
  author     = {Alexandru Calotoiu and Alexander Graf and Torsten Hoefler and Daniel Lorenz and Sebastian Rinke and Felix Wolf},
  title      = {Lightweight Requirements Engineering for Exascale Co-design},
  booktitle  = {{IEEE} International Conference on Cluster Computing, {CLUSTER} 2018, Belfast, UK, September 10-13, 2018},
  pages      = {201--211},
  publisher  = {{IEEE} Computer Society},
  year       = {2018},
  url        = {https://doi.org/10.1109/CLUSTER.2018.00038},
  doi        = {10.1109/CLUSTER.2018.00038},
  timestamp  = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/cluster/CalotoiuGHLR018.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: IEEE CLUSTER 2018.
@inproceedings{DBLP:conf/cluster/OyamaBHM18,
  author     = {Yosuke Oyama and Tal Ben{-}Nun and Torsten Hoefler and Satoshi Matsuoka},
  title      = {Accelerating Deep Learning Frameworks with Micro-Batches},
  booktitle  = {{IEEE} International Conference on Cluster Computing, {CLUSTER} 2018, Belfast, UK, September 10-13, 2018},
  pages      = {402--412},
  publisher  = {{IEEE} Computer Society},
  year       = {2018},
  url        = {https://doi.org/10.1109/CLUSTER.2018.00058},
  doi        = {10.1109/CLUSTER.2018.00058},
  timestamp  = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/cluster/OyamaBHM18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: EuroSys 2018.
@inproceedings{DBLP:conf/eurosys/TaranovAH18,
  author     = {Konstantin Taranov and Gustavo Alonso and Torsten Hoefler},
  editor     = {Rui Oliveira and Pascal Felber and Y. Charlie Hu},
  title      = {Fast and strongly-consistent per-item resilience in key-value stores},
  booktitle  = {Proceedings of the Thirteenth EuroSys Conference, EuroSys 2018, Porto, Portugal, April 23-26, 2018},
  pages      = {39:1--39:14},
  publisher  = {{ACM}},
  year       = {2018},
  url        = {https://doi.org/10.1145/3190508.3190536},
  doi        = {10.1145/3190508.3190536},
  timestamp  = {Thu, 23 Jun 2022 19:57:07 +0200},
  biburl     = {https://dblp.org/rec/conf/eurosys/TaranovAH18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: IEEE ICDE 2018.
% The acronym RDBMSs is brace-protected so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/icde/0002AHA18,
  author     = {Ingo M{\"{u}}ller and Andrea Arteaga and Torsten Hoefler and Gustavo Alonso},
  title      = {Reproducible Floating-Point Aggregation in {RDBMSs}},
  booktitle  = {34th {IEEE} International Conference on Data Engineering, {ICDE} 2018, Paris, France, April 16-19, 2018},
  pages      = {1049--1060},
  publisher  = {{IEEE} Computer Society},
  year       = {2018},
  url        = {https://doi.org/10.1109/ICDE.2018.00098},
  doi        = {10.1109/ICDE.2018.00098},
  timestamp  = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icde/0002AHA18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: NeurIPS 2018.
@inproceedings{DBLP:conf/nips/Ben-NunJH18,
  author     = {Tal Ben{-}Nun and Alice Shoshana Jakobovits and Torsten Hoefler},
  editor     = {Samy Bengio and Hanna M. Wallach and Hugo Larochelle and Kristen Grauman and Nicol{\`{o}} Cesa{-}Bianchi and Roman Garnett},
  title      = {Neural Code Comprehension: {A} Learnable Representation of Code Semantics},
  booktitle  = {Advances in Neural Information Processing Systems 31: Annual Conference on Neural Information Processing Systems 2018, NeurIPS 2018, December 3-8, 2018, Montr{\'{e}}al, Canada},
  pages      = {3589--3601},
  year       = {2018},
  url        = {https://proceedings.neurips.cc/paper/2018/hash/17c3433fecc21b57000debdf7ad5c930-Abstract.html},
  timestamp  = {Mon, 16 May 2022 15:41:51 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/Ben-NunJH18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: NeurIPS 2018.
@inproceedings{DBLP:conf/nips/AlistarhH0KKR18,
  author     = {Dan Alistarh and Torsten Hoefler and Mikael Johansson and Nikola Konstantinov and Sarit Khirirat and C{\'{e}}dric Renggli},
  editor     = {Samy Bengio and Hanna M. Wallach and Hugo Larochelle and Kristen Grauman and Nicol{\`{o}} Cesa{-}Bianchi and Roman Garnett},
  title      = {The Convergence of Sparsified Gradient Methods},
  booktitle  = {Advances in Neural Information Processing Systems 31: Annual Conference on Neural Information Processing Systems 2018, NeurIPS 2018, December 3-8, 2018, Montr{\'{e}}al, Canada},
  pages      = {5977--5987},
  year       = {2018},
  url        = {https://proceedings.neurips.cc/paper/2018/hash/314450613369e0ee72d0da7f6fee773c-Abstract.html},
  timestamp  = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/AlistarhH0KKR18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: PPoPP 2018.
@inproceedings{DBLP:conf/ppopp/GianinazziKPBH18,
  author     = {Lukas Gianinazzi and Pavel Kalvoda and Alessandro De Palma and Maciej Besta and Torsten Hoefler},
  editor     = {Andreas Krall and Thomas R. Gross},
  title      = {Communication-avoiding parallel minimum cuts and connected components},
  booktitle  = {Proceedings of the 23rd {ACM} {SIGPLAN} Symposium on Principles and Practice of Parallel Programming, PPoPP 2018, Vienna, Austria, February 24-28, 2018},
  pages      = {219--232},
  publisher  = {{ACM}},
  year       = {2018},
  url        = {https://doi.org/10.1145/3178487.3178504},
  doi        = {10.1145/3178487.3178504},
  timestamp  = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/ppopp/GianinazziKPBH18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: PPoPP 2018.
@inproceedings{DBLP:conf/ppopp/LichtBH18,
  author     = {Johannes de Fine Licht and Michaela Blott and Torsten Hoefler},
  editor     = {Andreas Krall and Thomas R. Gross},
  title      = {Designing scalable {FPGA} architectures using high-level synthesis},
  booktitle  = {Proceedings of the 23rd {ACM} {SIGPLAN} Symposium on Principles and Practice of Parallel Programming, PPoPP 2018, Vienna, Austria, February 24-28, 2018},
  pages      = {403--404},
  publisher  = {{ACM}},
  year       = {2018},
  url        = {https://doi.org/10.1145/3178487.3178527},
  doi        = {10.1145/3178487.3178527},
  timestamp  = {Sun, 12 Jun 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/ppopp/LichtBH18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: SC 2018.
% The system name ShenTu is brace-protected so sentence-casing styles keep its inner capital.
@inproceedings{DBLP:conf/sc/LinZYTXCZHMLZX18,
  author     = {Heng Lin and Xiaowei Zhu and Bowen Yu and Xiongchao Tang and Wei Xue and Wenguang Chen and Lufei Zhang and Torsten Hoefler and Xiaosong Ma and Xin Liu and Weimin Zheng and Jingfang Xu},
  title      = {{ShenTu}: processing multi-trillion edge graphs on millions of cores in seconds},
  booktitle  = {Proceedings of the International Conference for High Performance Computing, Networking, Storage, and Analysis, {SC} 2018, Dallas, TX, USA, November 11-16, 2018},
  pages      = {56:1--56:11},
  publisher  = {{IEEE} / {ACM}},
  year       = {2018},
  url        = {http://dl.acm.org/citation.cfm?id=3291731},
  timestamp  = {Mon, 24 Aug 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/sc/LinZYTXCZHMLZX18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: VMCAI 2018 (Lecture Notes in Computer Science, volume 10747).
@inproceedings{DBLP:conf/vmcai/BaumannDMHV18,
  author     = {Cedric Baumann and Andrei Marian Dan and Yuri Meshman and Torsten Hoefler and Martin T. Vechev},
  editor     = {Isil Dillig and Jens Palsberg},
  title      = {Automatic Verification of {RMA} Programs via Abstraction Extrapolation},
  booktitle  = {Verification, Model Checking, and Abstract Interpretation - 19th International Conference, {VMCAI} 2018, Los Angeles, CA, USA, January 7-9, 2018, Proceedings},
  series     = {Lecture Notes in Computer Science},
  volume     = {10747},
  pages      = {47--70},
  publisher  = {Springer},
  year       = {2018},
  url        = {https://doi.org/10.1007/978-3-319-73721-8\_3},
  doi        = {10.1007/978-3-319-73721-8\_3},
  timestamp  = {Tue, 14 May 2019 10:00:43 +0200},
  biburl     = {https://dblp.org/rec/conf/vmcai/BaumannDMHV18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1802.08021), 2018.
% The name SparCML is brace-protected so sentence-casing styles keep its capitalization.
@article{DBLP:journals/corr/abs-1802-08021,
  author     = {C{\'{e}}dric Renggli and Dan Alistarh and Torsten Hoefler},
  title      = {{SparCML}: High-Performance Sparse Communication for Machine Learning},
  journal    = {CoRR},
  volume     = {abs/1802.08021},
  year       = {2018},
  url        = {http://arxiv.org/abs/1802.08021},
  eprinttype = {arXiv},
  eprint     = {1802.08021},
  timestamp  = {Sun, 16 Dec 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1802-08021.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1802.09883), 2018.
% The acronym RDBMSs is brace-protected so sentence-casing styles do not lowercase it.
@article{DBLP:journals/corr/abs-1802-09883,
  author     = {Ingo M{\"{u}}ller and Andrea Arteaga and Torsten Hoefler and Gustavo Alonso},
  title      = {Reproducible Floating-Point Aggregation in {RDBMSs}},
  journal    = {CoRR},
  volume     = {abs/1802.09883},
  year       = {2018},
  url        = {http://arxiv.org/abs/1802.09883},
  eprinttype = {arXiv},
  eprint     = {1802.09883},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1802-09883.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1802.09941), 2018.
@article{DBLP:journals/corr/abs-1802-09941,
  author     = {Tal Ben{-}Nun and Torsten Hoefler},
  title      = {Demystifying Parallel and Distributed Deep Learning: An In-Depth Concurrency Analysis},
  journal    = {CoRR},
  volume     = {abs/1802.09941},
  year       = {2018},
  url        = {http://arxiv.org/abs/1802.09941},
  eprinttype = {arXiv},
  eprint     = {1802.09941},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1802-09941.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1804.04806), 2018.
% The library name cuDNN is brace-protected so sentence-casing styles do not lowercase it to "cudnn".
@article{DBLP:journals/corr/abs-1804-04806,
  author     = {Yosuke Oyama and Tal Ben{-}Nun and Torsten Hoefler and Satoshi Matsuoka},
  title      = {{\(\mu\)}-{cuDNN}: Accelerating Deep Learning Frameworks with Micro-Batching},
  journal    = {CoRR},
  volume     = {abs/1804.04806},
  year       = {2018},
  url        = {http://arxiv.org/abs/1804.04806},
  eprinttype = {arXiv},
  eprint     = {1804.04806},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1804-04806.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1805.08288), 2018.
@article{DBLP:journals/corr/abs-1805-08288,
  author     = {Johannes de Fine Licht and Maciej Besta and Simon Meierhans and Torsten Hoefler},
  title      = {Transformations of High-Level Synthesis Codes for High-Performance Computing},
  journal    = {CoRR},
  volume     = {abs/1805.08288},
  year       = {2018},
  url        = {http://arxiv.org/abs/1805.08288},
  eprinttype = {arXiv},
  eprint     = {1805.08288},
  timestamp  = {Wed, 16 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1805-08288.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1806.01799), 2018.
@article{DBLP:journals/corr/abs-1806-01799,
  author     = {Maciej Besta and Torsten Hoefler},
  title      = {Survey and Taxonomy of Lossless Graph Compression and Space-Efficient Graph Representations},
  journal    = {CoRR},
  volume     = {abs/1806.01799},
  year       = {2018},
  url        = {http://arxiv.org/abs/1806.01799},
  eprinttype = {arXiv},
  eprint     = {1806.01799},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1806-01799.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1806.07336), 2018.
@article{DBLP:journals/corr/abs-1806-07336,
  author     = {Tal Ben{-}Nun and Alice Shoshana Jakobovits and Torsten Hoefler},
  title      = {Neural Code Comprehension: {A} Learnable Representation of Code Semantics},
  journal    = {CoRR},
  volume     = {abs/1806.07336},
  year       = {2018},
  url        = {http://arxiv.org/abs/1806.07336},
  eprinttype = {arXiv},
  eprint     = {1806.07336},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1806-07336.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1809.10505), 2018.
@article{DBLP:journals/corr/abs-1809-10505,
  author     = {Dan Alistarh and Torsten Hoefler and Mikael Johansson and Sarit Khirirat and Nikola Konstantinov and C{\'{e}}dric Renggli},
  title      = {The Convergence of Sparsified Gradient Methods},
  journal    = {CoRR},
  volume     = {abs/1809.10505},
  year       = {2018},
  url        = {http://arxiv.org/abs/1809.10505},
  eprinttype = {arXiv},
  eprint     = {1809.10505},
  timestamp  = {Sun, 16 Dec 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1809-10505.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1810.00375), 2018.
% The proper noun Hoare is brace-protected so sentence-casing styles do not lowercase it.
@article{DBLP:journals/corr/abs-1810-00375,
  author     = {Thomas H{\"{a}}ner and Torsten Hoefler and Matthias Troyer},
  title      = {Using {Hoare} logic for quantum circuit optimization},
  journal    = {CoRR},
  volume     = {abs/1810.00375},
  year       = {2018},
  url        = {http://arxiv.org/abs/1810.00375},
  eprinttype = {arXiv},
  eprint     = {1810.00375},
  timestamp  = {Thu, 01 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1810-00375.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: IEEE Data Eng. Bull. 40(1), 2017.
@article{DBLP:journals/debu/BarthelsAH17,
  author     = {Claude Barthels and Gustavo Alonso and Torsten Hoefler},
  title      = {Designing Databases for Future High-Performance Networks},
  journal    = {{IEEE} Data Eng. Bull.},
  volume     = {40},
  number     = {1},
  pages      = {15--26},
  year       = {2017},
  url        = {http://sites.computer.org/debull/A17mar/p15.pdf},
  timestamp  = {Tue, 10 Mar 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/debu/BarthelsAH17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: Proc. VLDB Endow. 10(5), 2017.
@article{DBLP:journals/pvldb/BarthelsAHSM17,
  author     = {Claude Barthels and Gustavo Alonso and Torsten Hoefler and Timo Schneider and Ingo M{\"{u}}ller},
  title      = {Distributed Join Algorithms on Thousands of Cores},
  journal    = {Proc. {VLDB} Endow.},
  volume     = {10},
  number     = {5},
  pages      = {517--528},
  year       = {2017},
  url        = {http://www.vldb.org/pvldb/vol10/p517-barthels.pdf},
  doi        = {10.14778/3055540.3055545},
  timestamp  = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/pvldb/BarthelsAHSM17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: IEEE Trans. Parallel Distributed Syst. 28(10), 2017.
@article{DBLP:journals/tpds/UnatDHSABCCEFFH17,
  author     = {Didem Unat and Anshu Dubey and Torsten Hoefler and John Shalf and Mark James Abraham and Mauro Bianco and Bradford L. Chamberlain and Romain Cledat and H. Carter Edwards and Hal Finkel and Karl Fuerlinger and Frank Hannig and Emmanuel Jeannot and Amir Kamil and Jeff Keasler and Paul H. J. Kelly and Vitus J. Leung and Hatem Ltaief and Naoya Maruyama and Chris J. Newburn and Miquel Peric{\`{a}}s},
  title      = {Trends in Data Locality Abstractions for {HPC} Systems},
  journal    = {{IEEE} Trans. Parallel Distributed Syst.},
  volume     = {28},
  number     = {10},
  pages      = {3007--3020},
  year       = {2017},
  url        = {https://doi.org/10.1109/TPDS.2017.2703149},
  doi        = {10.1109/TPDS.2017.2703149},
  timestamp  = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/tpds/UnatDHSABCCEFFH17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: CIAC 2017 (Lecture Notes in Computer Science, volume 10236).
% The publisher field was missing; Lecture Notes in Computer Science is published by Springer.
@inproceedings{DBLP:conf/ciac/FoersterGHKSW17,
  author     = {Klaus{-}Tycho Foerster and Linus Groner and Torsten Hoefler and Michael K{\"{o}}nig and Sascha Schmid and Roger Wattenhofer},
  editor     = {Dimitris Fotakis and Aris Pagourtzis and Vangelis Th. Paschos},
  title      = {Multi-agent Pathfinding with n Agents on Graphs with n Vertices: Combinatorial Classification and Tight Algorithmic Bounds},
  booktitle  = {Algorithms and Complexity - 10th International Conference, {CIAC} 2017, Athens, Greece, May 24-26, 2017, Proceedings},
  series     = {Lecture Notes in Computer Science},
  volume     = {10236},
  pages      = {247--259},
  publisher  = {Springer},
  year       = {2017},
  url        = {https://doi.org/10.1007/978-3-319-57586-5\_21},
  doi        = {10.1007/978-3-319-57586-5\_21},
  timestamp  = {Mon, 30 Jan 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/ciac/FoersterGHKSW17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: IEEE HOTI 2017.
% The topology name Slim Fly is brace-protected so sentence-casing styles keep both capitals.
@inproceedings{DBLP:conf/hoti/YebenesEG0H17,
  author     = {Pedro Y{\'{e}}benes and Jes{\'{u}}s Escudero{-}Sahuquillo and Pedro Javier Garc{\'{\i}}a and Francisco J. Quiles and Torsten Hoefler},
  title      = {Improving Non-minimal and Adaptive Routing Algorithms in {Slim Fly} Networks},
  booktitle  = {25th {IEEE} Annual Symposium on High-Performance Interconnects, {HOTI} 2017, Santa Clara, CA, USA, August 28-30, 2017},
  pages      = {1--8},
  publisher  = {{IEEE} Computer Society},
  year       = {2017},
  url        = {https://doi.org/10.1109/HOTI.2017.11},
  doi        = {10.1109/HOTI.2017.11},
  timestamp  = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/hoti/YebenesEG0H17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: IEEE HOTI 2017.
@inproceedings{DBLP:conf/hoti/SchneiderDFUH17,
  author     = {Timo Schneider and James Dinan and Mario Flajslik and Keith D. Underwood and Torsten Hoefler},
  title      = {Fast Networks and Slow Memories: {A} Mechanism for Mitigating Bandwidth Mismatches},
  booktitle  = {25th {IEEE} Annual Symposium on High-Performance Interconnects, {HOTI} 2017, Santa Clara, CA, USA, August 28-30, 2017},
  pages      = {17--24},
  publisher  = {{IEEE} Computer Society},
  year       = {2017},
  url        = {https://doi.org/10.1109/HOTI.2017.17},
  doi        = {10.1109/HOTI.2017.17},
  timestamp  = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/hoti/SchneiderDFUH17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Workshop paper: HiPINEB 2017 (held with HPCA 2017).
% Slim Fly and the acronym HoL are brace-protected so sentence-casing styles keep their capitalization.
@inproceedings{DBLP:conf/hpca/YebenesEG0H17,
  author     = {Pedro Y{\'{e}}benes and Jes{\'{u}}s Escudero{-}Sahuquillo and Pedro Javier Garc{\'{\i}}a and Francisco J. Quiles and Torsten Hoefler},
  editor     = {Jes{\'{u}}s Escudero{-}Sahuquillo and Pedro Javier Garc{\'{\i}}a},
  title      = {An Effective Queuing Scheme to Provide {Slim Fly} Topologies with {HoL} Blocking Reduction and Deadlock Freedom for Minimal-Path Routing},
  booktitle  = {3rd {IEEE} International Workshop on High-Performance Interconnection Networks in the Exascale and Big-Data Era, HiPINEB@HPCA 2017, Austin, TX, USA, February 5, 2017},
  pages      = {25--32},
  publisher  = {{IEEE} Computer Society},
  year       = {2017},
  url        = {https://doi.org/10.1109/HiPINEB.2017.9},
  doi        = {10.1109/HIPINEB.2017.9},
  timestamp  = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/hpca/YebenesEG0H17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% HPDC 2017 conference paper, pages 93--104.
@inproceedings{DBLP:conf/hpdc/BestaPGSH17,
  author    = {Maciej Besta and Michal Podstawski and Linus Groner and Edgar Solomonik and Torsten Hoefler},
  editor    = {H. Howie Huang and Jon B. Weissman and Adriana Iamnitchi and Alexandru Iosup},
  title     = {To Push or To Pull: On Reducing Communication and Synchronization in Graph Computations},
  booktitle = {Proceedings of the 26th International Symposium on High-Performance Parallel and Distributed Computing, {HPDC} 2017, Washington, DC, USA, June 26-30, 2017},
  pages     = {93--104},
  publisher = {{ACM}},
  year      = {2017},
  url       = {https://doi.org/10.1145/3078597.3078616},
  doi       = {10.1145/3078597.3078616},
  timestamp = {Tue, 06 Nov 2018 11:07:20 +0100},
  biburl    = {https://dblp.org/rec/conf/hpdc/BestaPGSH17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% HPDC 2017 conference paper, pages 205--218.
% Fix: the camel-case system name "AllConcur" is brace-protected so that
% sentence-casing bibliography styles do not lowercase its inner capital.
@inproceedings{DBLP:conf/hpdc/PokeHG17,
  author    = {Marius Poke and Torsten Hoefler and Colin W. Glass},
  editor    = {H. Howie Huang and Jon B. Weissman and Adriana Iamnitchi and Alexandru Iosup},
  title     = {{AllConcur}: Leaderless Concurrent Atomic Broadcast},
  booktitle = {Proceedings of the 26th International Symposium on High-Performance Parallel and Distributed Computing, {HPDC} 2017, Washington, DC, USA, June 26-30, 2017},
  pages     = {205--218},
  publisher = {{ACM}},
  year      = {2017},
  url       = {https://doi.org/10.1145/3078597.3078598},
  doi       = {10.1145/3078597.3078598},
  timestamp = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/hpdc/PokeHG17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% ICCS 2017 conference paper, Procedia Computer Science vol. 108, pages 1542--1551.
@inproceedings{DBLP:conf/iccS/ArteagaFHS17,
  author    = {Andrea Arteaga and Oliver Fuhrer and Torsten Hoefler and Thomas C. Schulthess},
  editor    = {Petros Koumoutsakos and Michael Lees and Valeria V. Krzhizhanovskaya and Jack J. Dongarra and Peter M. A. Sloot},
  title     = {Model-Driven Choice of Numerical Methods for the Solution of the Linear Advection Equation},
  booktitle = {International Conference on Computational Science, {ICCS} 2017, 12-14 June 2017, Zurich, Switzerland},
  series    = {Procedia Computer Science},
  volume    = {108},
  pages     = {1542--1551},
  publisher = {Elsevier},
  year      = {2017},
  url       = {https://doi.org/10.1016/j.procs.2017.05.208},
  doi       = {10.1016/J.PROCS.2017.05.208},
  timestamp = {Thu, 08 Jul 2021 16:04:01 +0200},
  biburl    = {https://dblp.org/rec/conf/iccS/ArteagaFHS17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% IPDPS 2017 conference paper, pages 32--41.
% Fix: the camel-case name "SlimSell" is brace-protected so that sentence-casing
% bibliography styles do not lowercase its inner capital.
@inproceedings{DBLP:conf/ipps/BestaMSH17,
  author    = {Maciej Besta and Florian Marending and Edgar Solomonik and Torsten Hoefler},
  title     = {{SlimSell}: {A} Vectorizable Graph Representation for Breadth-First Search},
  booktitle = {2017 {IEEE} International Parallel and Distributed Processing Symposium, {IPDPS} 2017, Orlando, FL, USA, May 29 - June 2, 2017},
  pages     = {32--41},
  publisher = {{IEEE} Computer Society},
  year      = {2017},
  url       = {https://doi.org/10.1109/IPDPS.2017.93},
  doi       = {10.1109/IPDPS.2017.93},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/ipps/BestaMSH17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% IPDPS 2017 conference paper, pages 297--306.
% Fix: the product name "Xeon Phi" is brace-protected (like the adjacent KNL
% acronym) so that sentence-casing bibliography styles keep its capitals.
@inproceedings{DBLP:conf/ipps/RamosH17,
  author    = {Sabela Ramos and Torsten Hoefler},
  title     = {Capability Models for Manycore Memory Systems: {A} Case-Study with {Xeon Phi} {KNL}},
  booktitle = {2017 {IEEE} International Parallel and Distributed Processing Symposium, {IPDPS} 2017, Orlando, FL, USA, May 29 - June 2, 2017},
  pages     = {297--306},
  publisher = {{IEEE} Computer Society},
  year      = {2017},
  url       = {https://doi.org/10.1109/IPDPS.2017.30},
  doi       = {10.1109/IPDPS.2017.30},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/ipps/RamosH17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% IPDPS 2017 conference paper, pages 357--366.
@inproceedings{DBLP:conf/ipps/HoeflerBSD17,
  author    = {Torsten Hoefler and Amnon Barak and Amnon Shiloh and Zvi Drezner},
  title     = {Corrected Gossip Algorithms for Fast Reliable Broadcast on Unreliable Systems},
  booktitle = {2017 {IEEE} International Parallel and Distributed Processing Symposium, {IPDPS} 2017, Orlando, FL, USA, May 29 - June 2, 2017},
  pages     = {357--366},
  publisher = {{IEEE} Computer Society},
  year      = {2017},
  url       = {https://doi.org/10.1109/IPDPS.2017.36},
  doi       = {10.1109/IPDPS.2017.36},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/ipps/HoeflerBSD17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% IPDPS 2017 conference paper, pages 678--687.
@inproceedings{DBLP:conf/ipps/WickySH17,
  author    = {Tobias Wicky and Edgar Solomonik and Torsten Hoefler},
  title     = {Communication-Avoiding Parallel Algorithms for Solving Triangular Systems of Linear Equations},
  booktitle = {2017 {IEEE} International Parallel and Distributed Processing Symposium, {IPDPS} 2017, Orlando, FL, USA, May 29 - June 2, 2017},
  pages     = {678--687},
  publisher = {{IEEE} Computer Society},
  year      = {2017},
  url       = {https://doi.org/10.1109/IPDPS.2017.104},
  doi       = {10.1109/IPDPS.2017.104},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/ipps/WickySH17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% IPDPS 2017 conference paper, pages 1018--1027.
% Fix: the first author's compound surname is written in "Last, First" form.
% In "First Last" form BibTeX treats the capitalised "Di" as a given name, so
% abbreviating styles print "S. D. Girolamo" instead of "S. Di Girolamo".
@inproceedings{DBLP:conf/ipps/GirolamoVH17,
  author    = {Di Girolamo, Salvatore and Flavio Vella and Torsten Hoefler},
  title     = {Transparent Caching for {RMA} Systems},
  booktitle = {2017 {IEEE} International Parallel and Distributed Processing Symposium, {IPDPS} 2017, Orlando, FL, USA, May 29 - June 2, 2017},
  pages     = {1018--1027},
  publisher = {{IEEE} Computer Society},
  year      = {2017},
  url       = {https://doi.org/10.1109/IPDPS.2017.92},
  doi       = {10.1109/IPDPS.2017.92},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/ipps/GirolamoVH17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% IPDPS Workshops 2017 front matter (workshop introduction), page 1284.
@inproceedings{DBLP:conf/ipps/SongH17,
  author    = {Shuaiwen Leon Song and Torsten Hoefler},
  title     = {{IPDRM} Workshop Introduction},
  booktitle = {2017 {IEEE} International Parallel and Distributed Processing Symposium Workshops, {IPDPS} Workshops 2017, Orlando / Buena Vista, FL, USA, May 29 - June 2, 2017},
  pages     = {1284},
  publisher = {{IEEE} Computer Society},
  year      = {2017},
  url       = {https://doi.org/10.1109/IPDPSW.2017.184},
  doi       = {10.1109/IPDPSW.2017.184},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/ipps/SongH17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% IPDPS Workshops 2017 keynote entry, page 1558.
@inproceedings{DBLP:conf/ipps/Hoefler17,
  author    = {Torsten Hoefler},
  title     = {{EMBRACE} Keynote},
  booktitle = {2017 {IEEE} International Parallel and Distributed Processing Symposium Workshops, {IPDPS} Workshops 2017, Orlando / Buena Vista, FL, USA, May 29 - June 2, 2017},
  pages     = {1558},
  publisher = {{IEEE} Computer Society},
  year      = {2017},
  url       = {https://doi.org/10.1109/IPDPSW.2017.220},
  doi       = {10.1109/IPDPSW.2017.220},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/ipps/Hoefler17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% PPoPP 2017 conference paper, pages 131--143.
@inproceedings{DBLP:conf/ppopp/ShudlerCHW17,
  author    = {Sergei Shudler and Alexandru Calotoiu and Torsten Hoefler and Felix Wolf},
  editor    = {Vivek Sarkar and Lawrence Rauchwerger},
  title     = {Isoefficiency in Practice: Configuring and Understanding the Performance of Task-based Applications},
  booktitle = {Proceedings of the 22nd {ACM} {SIGPLAN} Symposium on Principles and Practice of Parallel Programming, Austin, TX, USA, February 4-8, 2017},
  pages     = {131--143},
  publisher = {{ACM}},
  year      = {2017},
  url       = {https://doi.org/10.1145/3018743.3018770},
  doi       = {10.1145/3018743.3018770},
  timestamp = {Sun, 12 Jun 2022 19:46:08 +0200},
  biburl    = {https://dblp.org/rec/conf/ppopp/ShudlerCHW17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% PPoPP 2017 poster abstract, pages 445--446.
@inproceedings{DBLP:conf/ppopp/0002ZH17,
  author    = {Shigang Li and Yunquan Zhang and Torsten Hoefler},
  editor    = {Vivek Sarkar and Lawrence Rauchwerger},
  title     = {{POSTER:} Cache-Oblivious {MPI} All-to-All Communications on Many-Core Architectures},
  booktitle = {Proceedings of the 22nd {ACM} {SIGPLAN} Symposium on Principles and Practice of Parallel Programming, Austin, TX, USA, February 4-8, 2017},
  pages     = {445--446},
  publisher = {{ACM}},
  year      = {2017},
  url       = {https://doi.org/10.1145/3018743.3019025},
  doi       = {10.1145/3018743.3019025},
  timestamp = {Sun, 12 Jun 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/ppopp/0002ZH17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% SC 2017 conference paper; the pages field holds the single value 47.
@inproceedings{DBLP:conf/sc/SolomonikBVH17,
  author    = {Edgar Solomonik and Maciej Besta and Flavio Vella and Torsten Hoefler},
  editor    = {Bernd Mohr and Padma Raghavan},
  title     = {Scaling betweenness centrality using communication-efficient sparse matrix multiplication},
  booktitle = {Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis, {SC} 2017, Denver, CO, USA, November 12 - 17, 2017},
  pages     = {47},
  publisher = {{ACM}},
  year      = {2017},
  url       = {https://doi.org/10.1145/3126908.3126971},
  doi       = {10.1145/3126908.3126971},
  timestamp = {Tue, 08 Nov 2022 16:03:02 +0100},
  biburl    = {https://dblp.org/rec/conf/sc/SolomonikBVH17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% SC 2017 conference paper; the pages field holds the single value 59.
% Fixes:
%  - "sPIN" is brace-protected; otherwise sentence-casing styles lowercase it.
%  - The second author's compound surname is written in "Last, First" form so
%    the capitalised "Di" is not parsed as a given name ("S. D. Girolamo").
@inproceedings{DBLP:conf/sc/HoeflerGTGB17,
  author    = {Torsten Hoefler and Di Girolamo, Salvatore and Konstantin Taranov and Ryan E. Grant and Ron Brightwell},
  editor    = {Bernd Mohr and Padma Raghavan},
  title     = {{sPIN}: high-performance streaming processing in the network},
  booktitle = {Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis, {SC} 2017, Denver, CO, USA, November 12 - 17, 2017},
  pages     = {59},
  publisher = {{ACM}},
  year      = {2017},
  url       = {https://doi.org/10.1145/3126908.3126970},
  doi       = {10.1145/3126908.3126970},
  timestamp = {Tue, 08 Nov 2022 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/sc/HoeflerGTGB17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% SPAA 2017 conference paper, pages 111--121.
@inproceedings{DBLP:conf/spaa/SolomonikBDH17,
  author    = {Edgar Solomonik and Grey Ballard and James Demmel and Torsten Hoefler},
  editor    = {Christian Scheideler and Mohammad Taghi Hajiaghayi},
  title     = {A Communication-Avoiding Parallel Algorithm for the Symmetric Eigenvalue Problem},
  booktitle = {Proceedings of the 29th {ACM} Symposium on Parallelism in Algorithms and Architectures, {SPAA} 2017, Washington DC, USA, July 24-26, 2017},
  pages     = {111--121},
  publisher = {{ACM}},
  year      = {2017},
  url       = {https://doi.org/10.1145/3087556.3087561},
  doi       = {10.1145/3087556.3087561},
  timestamp = {Sun, 25 Jul 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/spaa/SolomonikBDH17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Proceedings volume of the ROSS 2017 workshop (held with HPDC 2017).
% Fixes in the title: "Washingon" typo corrected to "Washington", the
% duplicated "DC, DC" collapsed, the degenerate date range "June 27 - 27"
% reduced to "June 27", and the ROSS/HPDC acronyms brace-protected.
@proceedings{DBLP:conf/hpdc/2017ross,
  editor    = {Torsten Hoefler and Kamil Iskra},
  title     = {Proceedings of the 7th International Workshop on Runtime and Operating Systems for Supercomputers, {ROSS}@{HPDC} 2017, Washington, DC, USA, June 27, 2017},
  publisher = {{ACM}},
  year      = {2017},
  url       = {https://doi.org/10.1145/3095770},
  doi       = {10.1145/3095770},
  isbn      = {978-1-4503-5086-0},
  timestamp = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/hpdc/2017ross.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1707.04618 (CoRR), 2017.
@article{DBLP:journals/corr/SolomonikDH17,
  author     = {Edgar Solomonik and James Demmel and Torsten Hoefler},
  title      = {Communication Lower Bounds of Bilinear Algorithms for Symmetric Tensor Contractions},
  journal    = {CoRR},
  volume     = {abs/1707.04618},
  year       = {2017},
  url        = {http://arxiv.org/abs/1707.04618},
  eprinttype = {arXiv},
  eprint     = {1707.04618},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/SolomonikDH17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1709.05483 (CoRR), 2017.
% Fixes:
%  - "sPIN" is brace-protected; otherwise sentence-casing styles lowercase it.
%  - The second author's compound surname is written in "Last, First" form so
%    the capitalised "Di" is not parsed as a given name ("S. D. Girolamo").
@article{DBLP:journals/corr/abs-1709-05483,
  author     = {Torsten Hoefler and Di Girolamo, Salvatore and Konstantin Taranov and Ryan E. Grant and Ron Brightwell},
  title      = {{sPIN}: High-performance streaming Processing in the Network},
  journal    = {CoRR},
  volume     = {abs/1709.05483},
  year       = {2017},
  url        = {http://arxiv.org/abs/1709.05483},
  eprinttype = {arXiv},
  eprint     = {1709.05483},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1709-05483.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Journal article, Int. J. High Perform. Comput. Appl. 30(1), pages 121--133.
@article{DBLP:journals/ijhpca/WidenerLFH16,
  author    = {Patrick M. Widener and Scott Levy and Kurt B. Ferreira and Torsten Hoefler},
  title     = {On noise and the performance benefit of nonblocking collectives},
  journal   = {Int. J. High Perform. Comput. Appl.},
  volume    = {30},
  number    = {1},
  pages     = {121--133},
  year      = {2016},
  url       = {https://doi.org/10.1177/1094342015611952},
  doi       = {10.1177/1094342015611952},
  timestamp = {Sun, 12 Feb 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/ijhpca/WidenerLFH16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Journal article, IEEE Micro 36(4), pages 6--17.
% Fix: the first author's compound surname is written in "Last, First" form.
% In "First Last" form BibTeX treats the capitalised "Di" as a given name, so
% abbreviating styles print "S. D. Girolamo" instead of "S. Di Girolamo".
@article{DBLP:journals/micro/GirolamoJUH16,
  author    = {Di Girolamo, Salvatore and Pierre Jolivet and Keith D. Underwood and Torsten Hoefler},
  title     = {Exploiting Offload-Enabled Network Interfaces},
  journal   = {{IEEE} Micro},
  volume    = {36},
  number    = {4},
  pages     = {6--17},
  year      = {2016},
  url       = {https://doi.org/10.1109/MM.2016.56},
  doi       = {10.1109/MM.2016.56},
  timestamp = {Sat, 20 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/micro/GirolamoJUH16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Journal article, IEEE Trans. Parallel Distributed Syst. 27(10), pages 2824--2837.
@article{DBLP:journals/tpds/RamosH16,
  author    = {Sabela Ramos and Torsten Hoefler},
  title     = {Cache Line Aware Algorithm Design for Cache-Coherent Architectures},
  journal   = {{IEEE} Trans. Parallel Distributed Syst.},
  volume    = {27},
  number    = {10},
  pages     = {2824--2837},
  year      = {2016},
  url       = {https://doi.org/10.1109/TPDS.2016.2516540},
  doi       = {10.1109/TPDS.2016.2516540},
  timestamp = {Fri, 02 Oct 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/tpds/RamosH16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% CLUSTER 2016 conference paper, pages 172--181.
@inproceedings{DBLP:conf/cluster/CalotoiuBEHKSW16,
  author    = {Alexandru Calotoiu and David Beckingsale and Christopher W. Earl and Torsten Hoefler and Ian Karlin and Martin Schulz and Felix Wolf},
  title     = {Fast Multi-parameter Performance Modeling},
  booktitle = {2016 {IEEE} International Conference on Cluster Computing, {CLUSTER} 2016, Taipei, Taiwan, September 12-16, 2016},
  pages     = {172--181},
  publisher = {{IEEE} Computer Society},
  year      = {2016},
  url       = {https://doi.org/10.1109/CLUSTER.2016.57},
  doi       = {10.1109/CLUSTER.2016.57},
  timestamp = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/cluster/CalotoiuBEHKSW16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% HOTI 2016 conference paper, pages 1--8.
% Fix: the camel-case name "InfiniBand" is brace-protected so that
% sentence-casing bibliography styles do not lowercase it.
@inproceedings{DBLP:conf/hoti/SchneiderBH16,
  author    = {Timo Schneider and Otto Bibartiu and Torsten Hoefler},
  title     = {Ensuring Deadlock-Freedom in Low-Diameter {InfiniBand} Networks},
  booktitle = {24th {IEEE} Annual Symposium on High-Performance Interconnects, {HOTI} 2016, Santa Clara, CA, USA, August 24-26, 2016},
  pages     = {1--8},
  publisher = {{IEEE} Computer Society},
  year      = {2016},
  url       = {https://doi.org/10.1109/HOTI.2016.015},
  doi       = {10.1109/HOTI.2016.015},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/hoti/SchneiderBH16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% HPDC 2016 conference paper, pages 3--14.
@inproceedings{DBLP:conf/hpdc/DomkeHM16,
  author    = {Jens Domke and Torsten Hoefler and Satoshi Matsuoka},
  editor    = {Hiroshi Nakashima and Kenjiro Taura and Jack Lange},
  title     = {Routing on the Dependency Graph: {A} New Approach to Deadlock-Free High-Performance Routing},
  booktitle = {Proceedings of the 25th {ACM} International Symposium on High-Performance Parallel and Distributed Computing, {HPDC} 2016, Kyoto, Japan, May 31 - June 04, 2016},
  pages     = {3--14},
  publisher = {{ACM}},
  year      = {2016},
  url       = {https://doi.org/10.1145/2907294.2907313},
  doi       = {10.1145/2907294.2907313},
  timestamp = {Tue, 06 Nov 2018 11:07:21 +0100},
  biburl    = {https://dblp.org/rec/conf/hpdc/DomkeHM16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% HPDC 2016 conference paper, pages 19--30.
@inproceedings{DBLP:conf/hpdc/SchmidBH16,
  author    = {Patrick Schmid and Maciej Besta and Torsten Hoefler},
  editor    = {Hiroshi Nakashima and Kenjiro Taura and Jack Lange},
  title     = {High-Performance Distributed {RMA} Locks},
  booktitle = {Proceedings of the 25th {ACM} International Symposium on High-Performance Parallel and Distributed Computing, {HPDC} 2016, Kyoto, Japan, May 31 - June 04, 2016},
  pages     = {19--30},
  publisher = {{ACM}},
  year      = {2016},
  url       = {https://doi.org/10.1145/2907294.2907323},
  doi       = {10.1145/2907294.2907323},
  timestamp = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/hpdc/SchmidBH16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% ICCCN 2016 conference paper, pages 1--10.
% Fix: the mixed-case name "SDNsec" is brace-protected so that sentence-casing
% bibliography styles do not lowercase its capitals.
@inproceedings{DBLP:conf/icccn/SasakiPLHP16,
  author    = {Takayuki Sasaki and Christos Pappas and Taeho Lee and Torsten Hoefler and Adrian Perrig},
  title     = {{SDNsec}: Forwarding Accountability for the {SDN} Data Plane},
  booktitle = {25th International Conference on Computer Communication and Networks, {ICCCN} 2016, Waikoloa, HI, USA, August 1-4, 2016},
  pages     = {1--10},
  publisher = {{IEEE}},
  year      = {2016},
  url       = {https://doi.org/10.1109/ICCCN.2016.7568569},
  doi       = {10.1109/ICCCN.2016.7568569},
  timestamp = {Thu, 12 Nov 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icccn/SasakiPLHP16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% ICS 2016 conference paper, pages 1:1--1:13.
% Fixes:
%  - A colon separates the system name from the subtitle; the original title
%    ran the two together ("Polly-ACC Transparent compilation ...").
%    NOTE(review): separator chosen by convention; confirm against the paper.
%  - "Polly-ACC" is brace-protected so sentence-casing styles keep its capitals.
@inproceedings{DBLP:conf/ics/GrosserH16,
  author    = {Tobias Grosser and Torsten Hoefler},
  editor    = {Ozcan Ozturk and Kemal Ebcioglu and Mahmut T. Kandemir and Onur Mutlu},
  title     = {{Polly-ACC}: Transparent compilation to heterogeneous hardware},
  booktitle = {Proceedings of the 2016 International Conference on Supercomputing, {ICS} 2016, Istanbul, Turkey, June 1-3, 2016},
  pages     = {1:1--1:13},
  publisher = {{ACM}},
  year      = {2016},
  url       = {https://doi.org/10.1145/2925426.2926286},
  doi       = {10.1145/2925426.2926286},
  timestamp = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/ics/GrosserH16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% OOPSLA 2016 conference paper, pages 129--144.
@inproceedings{DBLP:conf/oopsla/DanLHV16,
  author    = {Andrei Marian Dan and Patrick Lam and Torsten Hoefler and Martin T. Vechev},
  editor    = {Eelco Visser and Yannis Smaragdakis},
  title     = {Modeling and analysis of remote memory access programming},
  booktitle = {Proceedings of the 2016 {ACM} {SIGPLAN} International Conference on Object-Oriented Programming, Systems, Languages, and Applications, {OOPSLA} 2016, part of {SPLASH} 2016, Amsterdam, The Netherlands, October 30 - November 4, 2016},
  pages     = {129--144},
  publisher = {{ACM}},
  year      = {2016},
  url       = {https://doi.org/10.1145/2983990.2984033},
  doi       = {10.1145/2983990.2984033},
  timestamp = {Wed, 23 Jun 2021 15:34:31 +0200},
  biburl    = {https://dblp.org/rec/conf/oopsla/DanLHV16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% PASC 2016 proceedings contribution, page 13 (entry carries a url but no doi).
@inproceedings{DBLP:conf/pasc/Hoefler16,
  author    = {Torsten Hoefler},
  editor    = {Torsten Hoefler and David E. Keyes and Timothy Robinson},
  title     = {Selecting Technical Papers for an Interdisciplinary Conference: The {PASC} Review Process},
  booktitle = {Proceedings of the Platform for Advanced Scientific Computing Conference, {PASC} 2016, Lausanne, Switzerland, June 8-10, 2016},
  pages     = {13},
  publisher = {{ACM}},
  year      = {2016},
  url       = {http://dl.acm.org/citation.cfm?id=2970926},
  timestamp = {Tue, 06 Nov 2018 11:07:28 +0100},
  biburl    = {https://dblp.org/rec/conf/pasc/Hoefler16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% SC 2016 conference paper, pages 142--153.
@inproceedings{DBLP:conf/sc/DomkeH16,
  author    = {Jens Domke and Torsten Hoefler},
  editor    = {John West and Cherri M. Pancake},
  title     = {Scheduling-aware routing for supercomputers},
  booktitle = {Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis, {SC} 2016, Salt Lake City, UT, USA, November 13-18, 2016},
  pages     = {142--153},
  publisher = {{IEEE} Computer Society},
  year      = {2016},
  url       = {https://doi.org/10.1109/SC.2016.12},
  doi       = {10.1109/SC.2016.12},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/sc/DomkeH16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% SC 2016 conference paper, pages 502--513.
@inproceedings{DBLP:conf/sc/TangWEKHIMWORW16,
  author    = {William M. Tang and Bei Wang and St{\'{e}}phane Ethier and Grzegorz Kwasniewski and Torsten Hoefler and Khaled Z. Ibrahim and Kamesh Madduri and Samuel Williams and Leonid Oliker and Carlos Rosales{-}Fernandez and Timothy J. Williams},
  editor    = {John West and Cherri M. Pancake},
  title     = {Extreme scale plasma turbulence simulations on top supercomputers worldwide},
  booktitle = {Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis, {SC} 2016, Salt Lake City, UT, USA, November 13-18, 2016},
  pages     = {502--513},
  publisher = {{IEEE} Computer Society},
  year      = {2016},
  url       = {https://doi.org/10.1109/SC.2016.42},
  doi       = {10.1109/SC.2016.42},
  timestamp = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/sc/TangWEKHIMWORW16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% SC 2016 conference paper, pages 609--620.
% Fix: the mixed-case name "dCUDA" is brace-protected so that sentence-casing
% bibliography styles do not lowercase its capitals.
@inproceedings{DBLP:conf/sc/GysiBH16,
  author    = {Tobias Gysi and Jeremia B{\"{a}}r and Torsten Hoefler},
  editor    = {John West and Cherri M. Pancake},
  title     = {{dCUDA}: hardware supported overlap of computation and communication},
  booktitle = {Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis, {SC} 2016, Salt Lake City, UT, USA, November 13-18, 2016},
  pages     = {609--620},
  publisher = {{IEEE} Computer Society},
  year      = {2016},
  url       = {https://doi.org/10.1109/SC.2016.51},
  doi       = {10.1109/SC.2016.51},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/sc/GysiBH16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% SC 2016 conference paper, pages 739--749.
% Fix: the mixed-case acronym "PCIe" is brace-protected so that sentence-casing
% bibliography styles do not lowercase it.
@inproceedings{DBLP:conf/sc/MartinassoKASH16,
  author    = {Maxime Martinasso and Grzegorz Kwasniewski and Sadaf R. Alam and Thomas C. Schulthess and Torsten Hoefler},
  editor    = {John West and Cherri M. Pancake},
  title     = {A {PCIe} congestion-aware performance model for densely populated accelerator servers},
  booktitle = {Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis, {SC} 2016, Salt Lake City, UT, USA, November 13-18, 2016},
  pages     = {739--749},
  publisher = {{IEEE} Computer Society},
  year      = {2016},
  url       = {https://doi.org/10.1109/SC.2016.62},
  doi       = {10.1109/SC.2016.62},
  timestamp = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/sc/MartinassoKASH16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Book chapter in LNCSE vol. 113 (SPPEXA 2013-2015), pages 445--465.
% Fix: the underscore in the doi and url fields is stored unescaped. These
% fields are treated verbatim by url-aware styles and biblatex, so the
% original backslash-underscore ended up inside the generated link.
% NOTE(review): a legacy style that prints doi/url as plain text would need
% the escaped form instead -- confirm the target style.
@incollection{DBLP:series/lncse/WolfBCHIKMSSVW16,
  author    = {Felix Wolf and Christian H. Bischof and Alexandru Calotoiu and Torsten Hoefler and Christian Iwainsky and Grzegorz Kwasniewski and Bernd Mohr and Sergei Shudler and Alexandre Strube and Andreas Vogel and Gabriel Wittum},
  editor    = {Hans{-}Joachim Bungartz and Philipp Neumann and Wolfgang E. Nagel},
  title     = {Automatic Performance Modeling of {HPC} Applications},
  booktitle = {Software for Exascale Computing - {SPPEXA} 2013-2015},
  series    = {Lecture Notes in Computational Science and Engineering},
  volume    = {113},
  pages     = {445--465},
  publisher = {Springer},
  year      = {2016},
  url       = {https://doi.org/10.1007/978-3-319-40528-5_20},
  doi       = {10.1007/978-3-319-40528-5_20},
  timestamp = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/series/lncse/WolfBCHIKMSSVW16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Proceedings volume of the 6th Runtime and Operating Systems for Supercomputers workshop, 2016.
@proceedings{DBLP:conf/hpdc/2016ross,
  editor    = {Kamil Iskra and Torsten Hoefler},
  title     = {Proceedings of the 6th International Workshop on Runtime and Operating Systems for Supercomputers, Kyoto, Japan, June 1, 2016},
  publisher = {{ACM}},
  year      = {2016},
  url       = {https://doi.org/10.1145/2931088},
  doi       = {10.1145/2931088},
  isbn      = {978-1-4503-4387-9},
  timestamp = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/hpdc/2016ross.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Proceedings volume of PASC 2016.
@proceedings{DBLP:conf/pasc/2016,
  editor    = {Torsten Hoefler and David E. Keyes and Timothy Robinson},
  title     = {Proceedings of the Platform for Advanced Scientific Computing Conference, {PASC} 2016, Lausanne, Switzerland, June 8-10, 2016},
  publisher = {{ACM}},
  year      = {2016},
  url       = {https://doi.org/10.1145/2929908},
  doi       = {10.1145/2929908},
  isbn      = {978-1-4503-4126-4},
  timestamp = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/pasc/2016.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1604.03703 (CoRR), 2016.
@article{DBLP:journals/corr/SolomonikBDH16,
  author     = {Edgar Solomonik and Grey Ballard and James Demmel and Torsten Hoefler},
  title      = {A communication-avoiding parallel algorithm for the symmetric eigenvalue problem},
  journal    = {CoRR},
  volume     = {abs/1604.03703},
  year       = {2016},
  url        = {http://arxiv.org/abs/1604.03703},
  eprinttype = {arXiv},
  eprint     = {1604.03703},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/SolomonikBDH16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1605.01944 (CoRR), 2016.
% Fix: the mixed-case name "SDNsec" is brace-protected so that sentence-casing
% bibliography styles do not lowercase its capitals.
@article{DBLP:journals/corr/SasakiPLHP16,
  author     = {Takayuki Sasaki and Christos Pappas and Taeho Lee and Torsten Hoefler and Adrian Perrig},
  title      = {{SDNsec}: Forwarding Accountability for the {SDN} Data Plane},
  journal    = {CoRR},
  volume     = {abs/1605.01944},
  year       = {2016},
  url        = {http://arxiv.org/abs/1605.01944},
  eprinttype = {arXiv},
  eprint     = {1605.01944},
  timestamp  = {Thu, 12 Nov 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/SasakiPLHP16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1608.05866 (CoRR), 2016; extended version per its title.
% Fix: the camel-case system name "AllConcur" is brace-protected so that
% sentence-casing bibliography styles do not lowercase its inner capital.
@article{DBLP:journals/corr/PokeHG16,
  author     = {Marius Poke and Torsten Hoefler and Colin W. Glass},
  title      = {{AllConcur}: Leaderless Concurrent Atomic Broadcast (Extended Version)},
  journal    = {CoRR},
  volume     = {abs/1608.05866},
  year       = {2016},
  url        = {http://arxiv.org/abs/1608.05866},
  eprinttype = {arXiv},
  eprint     = {1608.05866},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/PokeHG16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1609.07008 (CoRR), 2016.
@article{DBLP:journals/corr/SolomonikBVH16,
  author     = {Edgar Solomonik and Maciej Besta and Flavio Vella and Torsten Hoefler},
  title      = {Betweenness Centrality is more Parallelizable than Dense Matrix Multiplication},
  journal    = {CoRR},
  volume     = {abs/1609.07008},
  year       = {2016},
  url        = {http://arxiv.org/abs/1609.07008},
  eprinttype = {arXiv},
  eprint     = {1609.07008},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/SolomonikBVH16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1612.01855 (CoRR), 2016.
@article{DBLP:journals/corr/WickySH16,
  author     = {Tobias Wicky and Edgar Solomonik and Torsten Hoefler},
  title      = {Communication-Avoiding Parallel Algorithms for Solving Triangular Systems of Linear Equations},
  journal    = {CoRR},
  volume     = {abs/1612.01855},
  year       = {2016},
  url        = {http://arxiv.org/abs/1612.01855},
  eprinttype = {arXiv},
  eprint     = {1612.01855},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/WickySH16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Journal item, Int. J. High Perform. Comput. Appl. 29(1), pages 3--4.
@article{DBLP:journals/ijhpca/IskraH15,
  author    = {Kamil Iskra and Torsten Hoefler},
  title     = {Operating systems and runtime environments on supercomputers},
  journal   = {Int. J. High Perform. Comput. Appl.},
  volume    = {29},
  number    = {1},
  pages     = {3--4},
  year      = {2015},
  url       = {https://doi.org/10.1177/1094342014560666},
  doi       = {10.1177/1094342014560666},
  timestamp = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/ijhpca/IskraH15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Journal article, ACM Trans. Parallel Comput. 2(2), pages 9:1--9:26.
@article{DBLP:journals/topc/HoeflerDTBBGU15,
  author    = {Torsten Hoefler and James Dinan and Rajeev Thakur and Brian Barrett and Pavan Balaji and William Gropp and Keith D. Underwood},
  title     = {Remote Memory Access Programming in {MPI-3}},
  journal   = {{ACM} Trans. Parallel Comput.},
  volume    = {2},
  number    = {2},
  pages     = {9:1--9:26},
  year      = {2015},
  url       = {https://doi.org/10.1145/2780584},
  doi       = {10.1145/2780584},
  timestamp = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/topc/HoeflerDTBBGU15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Special-issue introduction, ACM Trans. Parallel Comput. 2(3), pages 14e:1--14e:2.
@article{DBLP:journals/topc/DinitzH15,
  author    = {Michael Dinitz and Torsten Hoefler},
  title     = {Introduction to the Special Issue on {SPAA} 2013},
  journal   = {{ACM} Trans. Parallel Comput.},
  volume    = {2},
  number    = {3},
  pages     = {14e:1--14e:2},
  year      = {2015},
  url       = {https://doi.org/10.1145/2809923},
  doi       = {10.1145/2809923},
  timestamp = {Sat, 25 Apr 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/topc/DinitzH15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% PACT 2015 conference paper, pages 445--456.
@inproceedings{DBLP:conf/IEEEpact/SchweizerBH15,
  author    = {Hermann Schweizer and Maciej Besta and Torsten Hoefler},
  title     = {Evaluating the Cost of Atomic Operations on Modern Architectures},
  booktitle = {2015 International Conference on Parallel Architectures and Compilation, {PACT} 2015, San Francisco, CA, USA, October 18-21, 2015},
  pages     = {445--456},
  publisher = {{IEEE} Computer Society},
  year      = {2015},
  url       = {https://doi.org/10.1109/PACT.2015.24},
  doi       = {10.1109/PACT.2015.24},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/IEEEpact/SchweizerBH15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% PACT 2015 conference paper, pages 468--479.
@inproceedings{DBLP:conf/IEEEpact/BhattacharyyaKH15,
  author    = {Arnamoy Bhattacharyya and Grzegorz Kwasniewski and Torsten Hoefler},
  title     = {Using Compiler Techniques to Improve Automatic Performance Modeling},
  booktitle = {2015 International Conference on Parallel Architectures and Compilation, {PACT} 2015, San Francisco, CA, USA, October 18-21, 2015},
  pages     = {468--479},
  publisher = {{IEEE} Computer Society},
  year      = {2015},
  url       = {https://doi.org/10.1109/PACT.2015.39},
  doi       = {10.1109/PACT.2015.39},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/IEEEpact/BhattacharyyaKH15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% CFI '15 conference paper, pages 41--45.
@inproceedings{DBLP:conf/cfi/LeePBHHP15,
  author    = {Taeho Lee and Christos Pappas and Cristina Basescu and Jun Han and Torsten Hoefler and Adrian Perrig},
  title     = {Source-Based Path Selection: The Data Plane Perspective},
  booktitle = {The 10th International Conference on Future Internet, {CFI} '15, Seoul, Republic of Korea, June 8-10, 2015},
  pages     = {41--45},
  publisher = {{ACM}},
  year      = {2015},
  url       = {https://doi.org/10.1145/2775088.2775090},
  doi       = {10.1145/2775088.2775090},
  timestamp = {Thu, 12 Nov 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/cfi/LeePBHHP15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% HOTI 2015 conference paper, pages 26--33.
% Fix: the first author's compound surname is written in "Last, First" form.
% In "First Last" form BibTeX treats the capitalised "Di" as a given name, so
% abbreviating styles print "S. D. Girolamo" instead of "S. Di Girolamo".
@inproceedings{DBLP:conf/hoti/GirolamoJUH15,
  author    = {Di Girolamo, Salvatore and Pierre Jolivet and Keith D. Underwood and Torsten Hoefler},
  title     = {Exploiting Offload Enabled Network Interfaces},
  booktitle = {23rd {IEEE} Annual Symposium on High-Performance Interconnects, {HOTI} 2015, Santa Clara, CA, USA, August 26-28, 2015},
  pages     = {26--33},
  publisher = {{IEEE} Computer Society},
  year      = {2015},
  url       = {https://doi.org/10.1109/HOTI.2015.21},
  doi       = {10.1109/HOTI.2015.21},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/hoti/GirolamoJUH15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% HotOS XV workshop paper (entry has a url but no pages or doi field).
@inproceedings{DBLP:conf/hotos/HoeflerRR15,
  author    = {Torsten Hoefler and Robert B. Ross and Timothy Roscoe},
  editor    = {George Candea},
  title     = {Distributing the Data Plane for Remote Storage Access},
  booktitle = {15th Workshop on Hot Topics in Operating Systems, HotOS XV, Kartause Ittingen, Switzerland, May 18-20, 2015},
  publisher = {{USENIX} Association},
  year      = {2015},
  url       = {https://www.usenix.org/conference/hotos15/workshop-program/presentation/hoefler},
  timestamp = {Wed, 04 Jul 2018 13:06:34 +0200},
  biburl    = {https://dblp.org/rec/conf/hotos/HoeflerRR15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/hpdc/RamosH15,
  author     = {Sabela Ramos and Torsten Hoefler},
  editor     = {Thilo Kielmann and Dean Hildebrand and Michela Taufer},
  title      = {Cache Line Aware Optimizations for {ccNUMA} Systems},
  booktitle  = {Proceedings of the 24th International Symposium on High-Performance Parallel and Distributed Computing, {HPDC} 2015, Portland, OR, USA, June 15-19, 2015},
  pages      = {85--88},
  publisher  = {{ACM}},
  year       = {2015},
  url        = {https://doi.org/10.1145/2749246.2749256},
  doi        = {10.1145/2749246.2749256},
  timestamp  = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/hpdc/RamosH15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/hpdc/PokeH15,
  author     = {Marius Poke and Torsten Hoefler},
  editor     = {Thilo Kielmann and Dean Hildebrand and Michela Taufer},
  title      = {{DARE:} High-Performance State Machine Replication on {RDMA} Networks},
  booktitle  = {Proceedings of the 24th International Symposium on High-Performance Parallel and Distributed Computing, {HPDC} 2015, Portland, OR, USA, June 15-19, 2015},
  pages      = {107--118},
  publisher  = {{ACM}},
  year       = {2015},
  url        = {https://doi.org/10.1145/2749246.2749267},
  doi        = {10.1145/2749246.2749267},
  timestamp  = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/hpdc/PokeH15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/hpdc/BestaH15,
  author     = {Maciej Besta and Torsten Hoefler},
  editor     = {Thilo Kielmann and Dean Hildebrand and Michela Taufer},
  title      = {Accelerating Irregular Computations with Hardware Transactional Memory and Active Messages},
  booktitle  = {Proceedings of the 24th International Symposium on High-Performance Parallel and Distributed Computing, {HPDC} 2015, Portland, OR, USA, June 15-19, 2015},
  pages      = {161--172},
  publisher  = {{ACM}},
  year       = {2015},
  url        = {https://doi.org/10.1145/2749246.2749263},
  doi        = {10.1145/2749246.2749263},
  timestamp  = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/hpdc/BestaH15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/ics/BestaH15,
  author     = {Maciej Besta and Torsten Hoefler},
  editor     = {Laxmi N. Bhuyan and Fred Chong and Vivek Sarkar},
  title      = {Active Access: {A} Mechanism for High-Performance Distributed Data-Centric Computations},
  booktitle  = {Proceedings of the 29th {ACM} on International Conference on Supercomputing, ICS'15, Newport Beach/Irvine, CA, USA, June 08 - 11, 2015},
  pages      = {155--164},
  publisher  = {{ACM}},
  year       = {2015},
  url        = {https://doi.org/10.1145/2751205.2751219},
  doi        = {10.1145/2751205.2751219},
  timestamp  = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/ics/BestaH15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/ics/ShudlerCHSW15,
  author     = {Sergei Shudler and Alexandru Calotoiu and Torsten Hoefler and Alexandre Strube and Felix Wolf},
  editor     = {Laxmi N. Bhuyan and Fred Chong and Vivek Sarkar},
  title      = {Exascaling Your Library: Will Your Implementation Meet Your Expectations?},
  booktitle  = {Proceedings of the 29th {ACM} on International Conference on Supercomputing, ICS'15, Newport Beach/Irvine, CA, USA, June 08 - 11, 2015},
  pages      = {165--175},
  publisher  = {{ACM}},
  year       = {2015},
  url        = {https://doi.org/10.1145/2751205.2751216},
  doi        = {10.1145/2751205.2751216},
  timestamp  = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/ics/ShudlerCHSW15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/ics/GysiGH15,
  author     = {Tobias Gysi and Tobias Grosser and Torsten Hoefler},
  editor     = {Laxmi N. Bhuyan and Fred Chong and Vivek Sarkar},
  title      = {{MODESTO:} Data-centric Analytic Optimization of Complex Stencil Programs on Heterogeneous Architectures},
  booktitle  = {Proceedings of the 29th {ACM} on International Conference on Supercomputing, ICS'15, Newport Beach/Irvine, CA, USA, June 08 - 11, 2015},
  pages      = {177--186},
  publisher  = {{ACM}},
  year       = {2015},
  url        = {https://doi.org/10.1145/2751205.2751223},
  doi        = {10.1145/2751205.2751223},
  timestamp  = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/ics/GysiGH15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/ipps/HoeflerK15,
  author     = {Torsten Hoefler and Laxmikant V. Kal{\'{e}}},
  title      = {{HIPS-LSPP} Keynotes},
  booktitle  = {2015 {IEEE} International Parallel and Distributed Processing Symposium Workshop, {IPDPS} 2015, Hyderabad, India, May 25-29, 2015},
  pages      = {204},
  publisher  = {{IEEE} Computer Society},
  year       = {2015},
  url        = {https://doi.org/10.1109/IPDPSW.2015.173},
  doi        = {10.1109/IPDPSW.2015.173},
  timestamp  = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/ipps/HoeflerK15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/ipps/BelliH15,
  author     = {Roberto Belli and Torsten Hoefler},
  title      = {Notified Access: Extending Remote Memory Access Programming Models for Producer-Consumer Synchronization},
  booktitle  = {2015 {IEEE} International Parallel and Distributed Processing Symposium, {IPDPS} 2015, Hyderabad, India, May 25-29, 2015},
  pages      = {871--881},
  publisher  = {{IEEE} Computer Society},
  year       = {2015},
  url        = {https://doi.org/10.1109/IPDPS.2015.30},
  doi        = {10.1109/IPDPS.2015.30},
  timestamp  = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/ipps/BelliH15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/sc/KathareiosMPRH15,
  author     = {Georgios Kathareios and Cyriel Minkenberg and Bogdan Prisacari and Germ{\'{a}}n Rodr{\'{\i}}guez and Torsten Hoefler},
  editor     = {Jackie Kern and Jeffrey S. Vetter},
  title      = {Cost-effective diameter-two topologies: analysis and evaluation},
  booktitle  = {Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis, {SC} 2015, Austin, TX, USA, November 15-20, 2015},
  pages      = {36:1--36:11},
  publisher  = {{ACM}},
  year       = {2015},
  url        = {https://doi.org/10.1145/2807591.2807652},
  doi        = {10.1145/2807591.2807652},
  timestamp  = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/sc/KathareiosMPRH15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/sc/HoeflerB15,
  author     = {Torsten Hoefler and Roberto Belli},
  editor     = {Jackie Kern and Jeffrey S. Vetter},
  title      = {Scientific benchmarking of parallel computing systems: twelve ways to tell the masses when reporting performance results},
  booktitle  = {Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis, {SC} 2015, Austin, TX, USA, November 15-20, 2015},
  pages      = {73:1--73:12},
  publisher  = {{ACM}},
  year       = {2015},
  url        = {https://doi.org/10.1145/2807591.2807644},
  doi        = {10.1145/2807591.2807644},
  timestamp  = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/sc/HoeflerB15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@proceedings{DBLP:conf/hpdc/2015ross,
  editor     = {Torsten Hoefler and Kamil Iskra},
  title      = {Proceedings of the 5th International Workshop on Runtime and Operating Systems for Supercomputers, {ROSS} 2015, Portland, OR, USA, June 16, 2015},
  publisher  = {{ACM}},
  year       = {2015},
  url        = {https://doi.org/10.1145/2768405},
  doi        = {10.1145/2768405},
  isbn       = {978-1-4503-3606-2},
  timestamp  = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/hpdc/2015ross.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/SolomonikH15,
  author     = {Edgar Solomonik and Torsten Hoefler},
  title      = {Sparse Tensor Algebra as a Parallel Programming Model},
  journal    = {CoRR},
  volume     = {abs/1512.00066},
  year       = {2015},
  url        = {http://arxiv.org/abs/1512.00066},
  eprinttype = {arXiv},
  eprint     = {1512.00066},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/SolomonikH15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/cluster/0002HHS14,
  author     = {Shigang Li and Torsten Hoefler and Chungjin Hu and Marc Snir},
  title      = {Improved {MPI} collectives for {MPI} processes in shared address spaces},
  journal    = {Clust. Comput.},
  volume     = {17},
  number     = {4},
  pages      = {1139--1155},
  year       = {2014},
  url        = {https://doi.org/10.1007/s10586-014-0361-4},
  doi        = {10.1007/S10586-014-0361-4},
  timestamp  = {Tue, 29 Sep 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/cluster/0002HHS14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/computing/SchneiderGH14,
  author     = {Timo Schneider and Robert Gerstenberger and Torsten Hoefler},
  title      = {Application-oriented ping-pong benchmarking: how to assess the real communication overheads},
  journal    = {Computing},
  volume     = {96},
  number     = {4},
  pages      = {279--292},
  year       = {2014},
  url        = {https://doi.org/10.1007/s00607-013-0330-4},
  doi        = {10.1007/S00607-013-0330-4},
  timestamp  = {Thu, 06 Aug 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/computing/SchneiderGH14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/sp/GerstenbergerBH14,
  author     = {Robert Gerstenberger and Maciej Besta and Torsten Hoefler},
  title      = {Enabling highly-scalable remote memory access programming with {MPI-3} One Sided},
  journal    = {Sci. Program.},
  volume     = {22},
  number     = {2},
  pages      = {75--91},
  year       = {2014},
  url        = {https://doi.org/10.3233/SPR-140383},
  doi        = {10.3233/SPR-140383},
  timestamp  = {Wed, 06 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/sp/GerstenbergerBH14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/superfri/HoeflerM14,
  author     = {Torsten Hoefler and Dmitry Moor},
  title      = {Energy, Memory, and Runtime Tradeoffs for Implementing Collective Communication Operations},
  journal    = {Supercomput. Front. Innov.},
  volume     = {1},
  number     = {2},
  pages      = {58--75},
  year       = {2014},
  url        = {https://doi.org/10.14529/jsfi140204},
  doi        = {10.14529/JSFI140204},
  timestamp  = {Wed, 16 Dec 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/superfri/HoeflerM14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/IEEEpact/BhattacharyyaH14,
  author     = {Arnamoy Bhattacharyya and Torsten Hoefler},
  editor     = {Jos{\'{e}} Nelson Amaral and Josep Torrellas},
  title      = {{PEMOGEN:} automatic adaptive performance modeling during program runtime},
  booktitle  = {International Conference on Parallel Architectures and Compilation, {PACT} '14, Edmonton, AB, Canada, August 24-27, 2014},
  pages      = {393--404},
  publisher  = {{ACM}},
  year       = {2014},
  url        = {https://doi.org/10.1145/2628071.2628100},
  doi        = {10.1145/2628071.2628100},
  timestamp  = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/IEEEpact/BhattacharyyaH14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/europar/WolfBHMWCISV14,
  author     = {Felix Wolf and Christian H. Bischof and Torsten Hoefler and Bernd Mohr and Gabriel Wittum and Alexandru Calotoiu and Christian Iwainsky and Alexandre Strube and Andreas Vogel},
  editor     = {Lu{\'{\i}}s M. B. Lopes and Julius Zilinskas and Alexandru Costan and Roberto G. Cascella and Gabor Kecskemeti and Emmanuel Jeannot and Mario Cannataro and Laura Ricci and Siegfried Benkner and Salvador Petit and Vittorio Scarano and Jos{\'{e}} Gracia and Sascha Hunold and Stephen L. Scott and Stefan Lankes and Christian Lengauer and Jes{\'{u}}s Carretero and Jens Breitbart and Michael Alexander},
  title      = {Catwalk: {A} Quick Development Path for Performance Models},
  booktitle  = {Euro-Par 2014: Parallel Processing Workshops - Euro-Par 2014 International Workshops, Porto, Portugal, August 25-26, 2014, Revised Selected Papers, Part {II}},
  series     = {Lecture Notes in Computer Science},
  volume     = {8806},
  pages      = {589--600},
  publisher  = {Springer},
  year       = {2014},
  url        = {https://doi.org/10.1007/978-3-319-14313-2\_50},
  doi        = {10.1007/978-3-319-14313-2\_50},
  timestamp  = {Sun, 12 Nov 2023 02:07:45 +0100},
  biburl     = {https://dblp.org/rec/conf/europar/WolfBHMWCISV14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/hpdc/BestaH14,
  author     = {Maciej Besta and Torsten Hoefler},
  editor     = {Beth Plale and Matei Ripeanu and Franck Cappello and Dongyan Xu},
  title      = {Fault tolerance for remote memory access programming models},
  booktitle  = {The 23rd International Symposium on High-Performance Parallel and Distributed Computing, HPDC'14, Vancouver, BC, Canada - June 23 - 27, 2014},
  pages      = {37--48},
  publisher  = {{ACM}},
  year       = {2014},
  url        = {https://doi.org/10.1145/2600212.2600224},
  doi        = {10.1145/2600212.2600224},
  timestamp  = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/hpdc/BestaH14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/hpdc/PrisacariRHCMH14,
  author     = {Bogdan Prisacari and Germ{\'{a}}n Rodr{\'{\i}}guez and Philip Heidelberger and Dong Chen and Cyriel Minkenberg and Torsten Hoefler},
  editor     = {Beth Plale and Matei Ripeanu and Franck Cappello and Dongyan Xu},
  title      = {Efficient task placement and routing of nearest neighbor exchanges in dragonfly networks},
  booktitle  = {The 23rd International Symposium on High-Performance Parallel and Distributed Computing, HPDC'14, Vancouver, BC, Canada - June 23 - 27, 2014},
  pages      = {129--140},
  publisher  = {{ACM}},
  year       = {2014},
  url        = {https://doi.org/10.1145/2600212.2600225},
  doi        = {10.1145/2600212.2600225},
  timestamp  = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/hpdc/PrisacariRHCMH14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/ipps/ArteagaFH14,
  author     = {Andrea Arteaga and Oliver Fuhrer and Torsten Hoefler},
  title      = {Designing Bit-Reproducible Portable High-Performance Applications},
  booktitle  = {2014 {IEEE} 28th International Parallel and Distributed Processing Symposium, Phoenix, AZ, USA, May 19-23, 2014},
  pages      = {1235--1244},
  publisher  = {{IEEE} Computer Society},
  year       = {2014},
  url        = {https://doi.org/10.1109/IPDPS.2014.127},
  doi        = {10.1109/IPDPS.2014.127},
  timestamp  = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/ipps/ArteagaFH14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/pvm/WidenerFLH14,
  author     = {Patrick M. Widener and Kurt B. Ferreira and Scott Levy and Torsten Hoefler},
  editor     = {Jack J. Dongarra and Yutaka Ishikawa and Atsushi Hori},
  title      = {Exploring the effect of noise on the performance benefit of nonblocking allreduce},
  booktitle  = {21st European {MPI} Users' Group Meeting, EuroMPI/ASIA '14, Kyoto, Japan - September 09 - 12, 2014},
  pages      = {77},
  publisher  = {{ACM}},
  year       = {2014},
  url        = {https://doi.org/10.1145/2642769.2642786},
  doi        = {10.1145/2642769.2642786},
  timestamp  = {Sun, 12 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/pvm/WidenerFLH14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/sc/BestaH14,
  author     = {Maciej Besta and Torsten Hoefler},
  editor     = {Trish Damkroger and Jack J. Dongarra},
  title      = {{Slim} {Fly}: {A} Cost Effective Low-Diameter Network Topology},
  booktitle  = {International Conference for High Performance Computing, Networking, Storage and Analysis, {SC} 2014, New Orleans, LA, USA, November 16-21, 2014},
  pages      = {348--359},
  publisher  = {{IEEE} Computer Society},
  year       = {2014},
  url        = {https://doi.org/10.1109/SC.2014.34},
  doi        = {10.1109/SC.2014.34},
  timestamp  = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/sc/BestaH14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/sc/DomkeHM14,
  author     = {Jens Domke and Torsten Hoefler and Satoshi Matsuoka},
  editor     = {Trish Damkroger and Jack J. Dongarra},
  title      = {Fail-in-Place Network Design: Interaction Between Topology, Routing Algorithm and Failures},
  booktitle  = {International Conference for High Performance Computing, Networking, Storage and Analysis, {SC} 2014, New Orleans, LA, USA, November 16-21, 2014},
  pages      = {597--608},
  publisher  = {{IEEE} Computer Society},
  year       = {2014},
  url        = {https://doi.org/10.1109/SC.2014.54},
  doi        = {10.1109/SC.2014.54},
  timestamp  = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/sc/DomkeHM14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/sc/FerreiraWLAH14,
  author     = {Kurt B. Ferreira and Patrick M. Widener and Scott Levy and Dorian C. Arnold and Torsten Hoefler},
  editor     = {Trish Damkroger and Jack J. Dongarra},
  title      = {Understanding the Effects of Communication and Coordination on Checkpointing at Scale},
  booktitle  = {International Conference for High Performance Computing, Networking, Storage and Analysis, {SC} 2014, New Orleans, LA, USA, November 16-21, 2014},
  pages      = {883--894},
  publisher  = {{IEEE} Computer Society},
  year       = {2014},
  url        = {https://doi.org/10.1109/SC.2014.77},
  doi        = {10.1109/SC.2014.77},
  timestamp  = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/sc/FerreiraWLAH14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/spaa/HoeflerK14,
  author     = {Torsten Hoefler and Grzegorz Kwasniewski},
  editor     = {Guy E. Blelloch and Peter Sanders},
  title      = {Automatic complexity analysis of explicitly parallel programs},
  booktitle  = {26th {ACM} Symposium on Parallelism in Algorithms and Architectures, {SPAA} '14, Prague, Czech Republic - June 23 - 25, 2014},
  pages      = {226--235},
  publisher  = {{ACM}},
  year       = {2014},
  url        = {https://doi.org/10.1145/2612669.2612685},
  doi        = {10.1145/2612669.2612685},
  timestamp  = {Wed, 21 Nov 2018 11:18:43 +0100},
  biburl     = {https://dblp.org/rec/conf/spaa/HoeflerK14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@proceedings{DBLP:conf/ics/2014ross,
  editor     = {Kamil Iskra and Torsten Hoefler},
  title      = {Proceedings of the 4th International Workshop on Runtime and Operating Systems for Supercomputers, {ROSS} 2014, Munich, Germany, June 10, 2014},
  publisher  = {{ACM}},
  year       = {2014},
  url        = {https://doi.org/10.1145/2612262},
  doi        = {10.1145/2612262},
  isbn       = {978-1-4503-2950-7},
  timestamp  = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/ics/2014ross.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/computing/HoeflerDBBBBGKT13,
  author     = {Torsten Hoefler and James Dinan and Darius Buntinas and Pavan Balaji and Brian Barrett and Ron Brightwell and William Gropp and Vivek Kale and Rajeev Thakur},
  title      = {{MPI} + {MPI:} a new hybrid approach to parallel programming with {MPI} plus shared memory},
  journal    = {Computing},
  volume     = {95},
  number     = {12},
  pages      = {1121--1136},
  year       = {2013},
  url        = {https://doi.org/10.1007/s00607-013-0324-2},
  doi        = {10.1007/S00607-013-0324-2},
  timestamp  = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/computing/HoeflerDBBBBGKT13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/ijhpca/HoeflerI13,
  author     = {Torsten Hoefler and Kamil Iskra},
  title      = {Operating systems and runtime environments on supercomputers},
  journal    = {Int. J. High Perform. Comput. Appl.},
  volume     = {27},
  number     = {2},
  pages      = {123},
  year       = {2013},
  url        = {https://doi.org/10.1177/1094342013481376},
  doi        = {10.1177/1094342013481376},
  timestamp  = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/ijhpca/HoeflerI13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/taco/PrisacariRMH13,
  author     = {Bogdan Prisacari and Germ{\'{a}}n Rodr{\'{\i}}guez and Cyriel Minkenberg and Torsten Hoefler},
  title      = {Fast pattern-specific routing for fat tree networks},
  journal    = {{ACM} Trans. Archit. Code Optim.},
  volume     = {10},
  number     = {4},
  pages      = {36:1--36:25},
  year       = {2013},
  url        = {https://doi.org/10.1145/2541228.2555293},
  doi        = {10.1145/2541228.2555293},
  timestamp  = {Wed, 17 Feb 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/taco/PrisacariRMH13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/europar/LysneHLB13,
  author     = {Olav Lysne and Torsten Hoefler and Pedro L{\'{o}}pez and Davide Bertozzi},
  editor     = {Felix Wolf and Bernd Mohr and Dieter an Mey},
  title      = {Topic 13: High-Performance Networks and Communication - (Introduction)},
  booktitle  = {Euro-Par 2013 Parallel Processing - 19th International Conference, Aachen, Germany, August 26-30, 2013. Proceedings},
  series     = {Lecture Notes in Computer Science},
  volume     = {8097},
  pages      = {684},
  publisher  = {Springer},
  year       = {2013},
  url        = {https://doi.org/10.1007/978-3-642-40047-6\_68},
  doi        = {10.1007/978-3-642-40047-6\_68},
  timestamp  = {Tue, 14 May 2019 10:00:46 +0200},
  biburl     = {https://dblp.org/rec/conf/europar/LysneHLB13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/hpdc/LiHS13,
  author     = {Shigang Li and Torsten Hoefler and Marc Snir},
  editor     = {Manish Parashar and Jon B. Weissman and Dick H. J. Epema and Renato J. O. Figueiredo},
  title      = {{NUMA}-aware shared-memory collective communication for {MPI}},
  booktitle  = {The 22nd International Symposium on High-Performance Parallel and Distributed Computing, HPDC'13, New York, NY, {USA} - June 17 - 21, 2013},
  pages      = {85--96},
  publisher  = {{ACM}},
  year       = {2013},
  url        = {https://dl.acm.org/citation.cfm?id=2462903},
  timestamp  = {Mon, 26 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/hpdc/LiHS13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/hpdc/RamosH13,
  author     = {Sabela Ramos and Torsten Hoefler},
  editor     = {Manish Parashar and Jon B. Weissman and Dick H. J. Epema and Renato J. O. Figueiredo},
  title      = {Modeling communication in cache-coherent {SMP} systems: a case-study with {Xeon} {Phi}},
  booktitle  = {The 22nd International Symposium on High-Performance Parallel and Distributed Computing, HPDC'13, New York, NY, {USA} - June 17 - 21, 2013},
  pages      = {97--108},
  publisher  = {{ACM}},
  year       = {2013},
  url        = {https://dl.acm.org/citation.cfm?id=2462916},
  timestamp  = {Mon, 26 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/hpdc/RamosH13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icpp/SchneiderHGBB13,
  author     = {Timo Schneider and Torsten Hoefler and Ryan E. Grant and Brian W. Barrett and Ron Brightwell},
  title      = {Protocols for Fully Offloaded Collective Operations on Accelerated Network Adapters},
  booktitle  = {42nd International Conference on Parallel Processing, {ICPP} 2013, Lyon, France, October 1-4, 2013},
  pages      = {593--602},
  publisher  = {{IEEE} Computer Society},
  year       = {2013},
  url        = {https://doi.org/10.1109/ICPP.2013.73},
  doi        = {10.1109/ICPP.2013.73},
  timestamp  = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icpp/SchneiderHGBB13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/ics/PrisacariRMH13,
  author     = {Bogdan Prisacari and Germ{\'{a}}n Rodr{\'{\i}}guez and Cyriel Minkenberg and Torsten Hoefler},
  editor     = {Allen D. Malony and Mario Nemirovsky and Samuel P. Midkiff},
  title      = {Bandwidth-optimal all-to-all exchanges in fat tree networks},
  booktitle  = {International Conference on Supercomputing, ICS'13, Eugene, OR, {USA} - June 10 - 14, 2013},
  pages      = {139--148},
  publisher  = {{ACM}},
  year       = {2013},
  url        = {https://doi.org/10.1145/2464996.2465434},
  doi        = {10.1145/2464996.2465434},
  timestamp  = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/ics/PrisacariRMH13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/lcpc/SchneiderGH13,
  author     = {Timo Schneider and Robert Gerstenberger and Torsten Hoefler},
  editor     = {Calin Cascaval and Pablo Montesinos},
  title      = {Compiler Optimizations for Non-contiguous Remote Data Movement},
  booktitle  = {Languages and Compilers for Parallel Computing - 26th International Workshop, {LCPC} 2013, San Jose, CA, USA, September 25-27, 2013. Revised Selected Papers},
  series     = {Lecture Notes in Computer Science},
  volume     = {8664},
  pages      = {307--321},
  publisher  = {Springer},
  year       = {2013},
  url        = {https://doi.org/10.1007/978-3-319-09967-5\_18},
  doi        = {10.1007/978-3-319-09967-5\_18},
  timestamp  = {Tue, 14 May 2019 10:00:47 +0200},
  biburl     = {https://dblp.org/rec/conf/lcpc/SchneiderGH13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/ppopp/FriedleyHBLM13,
  author     = {Andrew Friedley and Torsten Hoefler and Greg Bronevetsky and Andrew Lumsdaine and Ching{-}Chen Ma},
  editor     = {Alex Nicolau and Xiaowei Shen and Saman P. Amarasinghe and Richard W. Vuduc},
  title      = {Ownership passing: efficient distributed memory programming on multi-core systems},
  booktitle  = {{ACM} {SIGPLAN} Symposium on Principles and Practice of Parallel Programming, PPoPP '13, Shenzhen, China, February 23-27, 2013},
  pages      = {177--186},
  publisher  = {{ACM}},
  year       = {2013},
  url        = {https://doi.org/10.1145/2442516.2442534},
  doi        = {10.1145/2442516.2442534},
  timestamp  = {Sun, 12 Jun 2022 19:46:08 +0200},
  biburl     = {https://dblp.org/rec/conf/ppopp/FriedleyHBLM13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/pvm/SchneiderKH13,
  author     = {Timo Schneider and Fredrik Kjolstad and Torsten Hoefler},
  editor     = {Jack J. Dongarra and Javier Garc{\'{\i}}a Blas and Jes{\'{u}}s Carretero},
  title      = {{MPI} datatype processing using runtime compilation},
  booktitle  = {20th European {MPI} Users' Group Meeting, EuroMPI '13, Madrid, Spain - September 15 - 18, 2013},
  pages      = {19--24},
  publisher  = {{ACM}},
  year       = {2013},
  url        = {https://doi.org/10.1145/2488551.2488552},
  doi        = {10.1145/2488551.2488552},
  timestamp  = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/pvm/SchneiderKH13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/sc/FriedleyBHL13,
  author     = {Andrew Friedley and Greg Bronevetsky and Torsten Hoefler and Andrew Lumsdaine},
  editor     = {William Gropp and Satoshi Matsuoka},
  title      = {Hybrid {MPI:} efficient message passing for multi-core systems},
  booktitle  = {International Conference for High Performance Computing, Networking, Storage and Analysis, SC'13, Denver, CO, {USA} - November 17 - 21, 2013},
  pages      = {18:1--18:11},
  publisher  = {{ACM}},
  year       = {2013},
  url        = {https://doi.org/10.1145/2503210.2503294},
  doi        = {10.1145/2503210.2503294},
  timestamp  = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/sc/FriedleyBHL13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/sc/CalotoiuHPW13,
  author     = {Alexandru Calotoiu and Torsten Hoefler and Marius Poke and Felix Wolf},
  editor     = {William Gropp and Satoshi Matsuoka},
  title      = {Using automated performance modeling to find scalability bugs in complex codes},
  booktitle  = {International Conference for High Performance Computing, Networking, Storage and Analysis, SC'13, Denver, CO, {USA} - November 17 - 21, 2013},
  pages      = {45:1--45:12},
  publisher  = {{ACM}},
  year       = {2013},
  url        = {https://doi.org/10.1145/2503210.2503277},
  doi        = {10.1145/2503210.2503277},
  timestamp  = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/sc/CalotoiuHPW13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/sc/GerstenbergerBH13,
  author     = {Robert Gerstenberger and Maciej Besta and Torsten Hoefler},
  editor     = {William Gropp and Satoshi Matsuoka},
  title      = {Enabling highly-scalable remote memory access programming with {MPI-3} one sided},
  booktitle  = {International Conference for High Performance Computing, Networking, Storage and Analysis, SC'13, Denver, CO, {USA} - November 17 - 21, 2013},
  pages      = {53:1--53:12},
  publisher  = {{ACM}},
  year       = {2013},
  url        = {https://doi.org/10.1145/2503210.2503286},
  doi        = {10.1145/2503210.2503286},
  timestamp  = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/sc/GerstenbergerBH13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/sc/LevyTFAHW13,
  author     = {Scott Levy and Bryan Topp and Kurt B. Ferreira and Dorian C. Arnold and Torsten Hoefler and Patrick M. Widener},
  editor     = {Stephen A. Jarvis and Steven A. Wright and Simon D. Hammond},
  title      = {Using Simulation to Evaluate the Performance of Resilience Strategies at Scale},
  booktitle  = {High Performance Computing Systems. Performance Modeling, Benchmarking and Simulation - 4th International Workshop, {PMBS} 2013, Denver, CO, USA, November 18, 2013. Revised Selected Papers},
  series     = {Lecture Notes in Computer Science},
  volume     = {8551},
  pages      = {91--114},
  publisher  = {Springer},
  year       = {2013},
  url        = {https://doi.org/10.1007/978-3-319-10214-6\_5},
  doi        = {10.1007/978-3-319-10214-6\_5},
  timestamp  = {Sun, 12 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/sc/LevyTFAHW13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@proceedings{DBLP:conf/ics/2013ross,
  editor     = {Torsten Hoefler and Kamil Iskra},
  title      = {Proceedings of the 3rd International Workshop on Runtime and Operating Systems for Supercomputers, {ROSS} 2013, Eugene, Oregon, USA, June 10, 2013},
  publisher  = {{ACM}},
  year       = {2013},
  url        = {https://doi.org/10.1145/2491661},
  doi        = {10.1145/2491661},
  isbn       = {978-1-4503-2146-4},
  timestamp  = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/ics/2013ross.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/ijhpca/HoeflerI12,
  author     = {Torsten Hoefler and Kamil Iskra},
  title      = {Operating systems and runtime environments on supercomputers},
  journal    = {Int. J. High Perform. Comput. Appl.},
  volume     = {26},
  number     = {2},
  pages      = {93--94},
  year       = {2012},
  url        = {https://doi.org/10.1177/1094342012442456},
  doi        = {10.1177/1094342012442456},
  timestamp  = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/ijhpca/HoeflerI12.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/micro/HoeflerGPT12,
  author     = {Torsten Hoefler and Patrick Geoffray and Fabrizio Petrini and Jesper Larsson Tr{\"{a}}ff},
  title      = {Top Picks from {Hot} {Interconnects} 2011: Petascale Network Architectures},
  journal    = {{IEEE} Micro},
  volume     = {32},
  number     = {1},
  pages      = {4--7},
  year       = {2012},
  url        = {https://doi.org/10.1109/MM.2012.11},
  doi        = {10.1109/MM.2012.11},
  timestamp  = {Wed, 11 Sep 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/micro/HoeflerGPT12.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/pc/Hoefler12,
  author     = {Torsten Hoefler},
  title      = {Extensions for next-generation parallel programming models},
  journal    = {Parallel Comput.},
  volume     = {38},
  number     = {1-2},
  pages      = {1},
  year       = {2012},
  url        = {https://doi.org/10.1016/j.parco.2011.10.012},
  doi        = {10.1016/J.PARCO.2011.10.012},
  timestamp  = {Sat, 22 Feb 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/pc/Hoefler12.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/IEEEpact/HoeflerS12,
  author     = {Torsten Hoefler and Timo Schneider},
  editor     = {Pen{-}Chung Yew and Sangyeun Cho and Luiz DeRose and David J. Lilja},
  title      = {Runtime detection and optimization of collective communication patterns},
  booktitle  = {International Conference on Parallel Architectures and Compilation Techniques, {PACT} '12, Minneapolis, MN, {USA} - September 19 - 23, 2012},
  pages      = {263--272},
  publisher  = {{ACM}},
  year       = {2012},
  url        = {https://doi.org/10.1145/2370816.2370856},
  doi        = {10.1145/2370816.2370856},
  timestamp  = {Wed, 11 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/IEEEpact/HoeflerS12.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper -- CCGrid 2012.
@inproceedings{DBLP:conf/ccgrid/GottschlingH12,
  author    = {Peter Gottschling and Torsten Hoefler},
  title     = {Productive Parallel Linear Algebra Programming with Unstructured Topology Adaption},
  booktitle = {12th {IEEE/ACM} International Symposium on Cluster, Cloud and Grid Computing, CCGrid 2012, Ottawa, Canada, May 13-16, 2012},
  pages     = {9--16},
  publisher = {{IEEE} Computer Society},
  year      = {2012},
  url       = {https://doi.org/10.1109/CCGrid.2012.51},
  doi       = {10.1109/CCGRID.2012.51},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/ccgrid/GottschlingH12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper -- CCGrid 2012.
@inproceedings{DBLP:conf/ccgrid/BauerGH12,
  author    = {Greg Bauer and Steven Gottlieb and Torsten Hoefler},
  title     = {Performance Modeling and Comparative Analysis of the {MILC} Lattice {QCD} Application su3{\_}rmd},
  booktitle = {12th {IEEE/ACM} International Symposium on Cluster, Cloud and Grid Computing, CCGrid 2012, Ottawa, Canada, May 13-16, 2012},
  pages     = {652--659},
  publisher = {{IEEE} Computer Society},
  year      = {2012},
  url       = {https://doi.org/10.1109/CCGrid.2012.123},
  doi       = {10.1109/CCGRID.2012.123},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/ccgrid/BauerGH12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper -- CLUSTER 2012.
@inproceedings{DBLP:conf/cluster/PellegriniHF12,
  author    = {Simone Pellegrini and Torsten Hoefler and Thomas Fahringer},
  title     = {On the Effects of {CPU} Caches on {MPI} Point-to-Point Communications},
  booktitle = {2012 {IEEE} International Conference on Cluster Computing, {CLUSTER} 2012, Beijing, China, September 24-28, 2012},
  pages     = {495--503},
  publisher = {{IEEE} Computer Society},
  year      = {2012},
  url       = {https://doi.org/10.1109/CLUSTER.2012.22},
  doi       = {10.1109/CLUSTER.2012.22},
  timestamp = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/cluster/PellegriniHF12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper -- PDP 2012.
@inproceedings{DBLP:conf/pdp/KharbasKHM12,
  author    = {Kishor Kharbas and Donghoon Kim and Torsten Hoefler and Frank Mueller},
  editor    = {Rainer Stotzka and Michael Schiffers and Yannis Cotronis},
  title     = {Assessing {HPC} Failure Detectors for {MPI} Jobs},
  booktitle = {Proceedings of the 20th Euromicro International Conference on Parallel, Distributed and Network-Based Processing, {PDP} 2012, Munich, Germany, February 15-17, 2012},
  pages     = {81--88},
  publisher = {{IEEE}},
  year      = {2012},
  url       = {https://doi.org/10.1109/PDP.2012.11},
  doi       = {10.1109/PDP.2012.11},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/pdp/KharbasKHM12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper -- PPOPP 2012.
@inproceedings{DBLP:conf/ppopp/HoeflerS12,
  author    = {Torsten Hoefler and Timo Schneider},
  editor    = {J. Ramanujam and P. Sadayappan},
  title     = {Communication-centric optimizations by dynamically detecting collective operations},
  booktitle = {Proceedings of the 17th {ACM} {SIGPLAN} Symposium on Principles and Practice of Parallel Programming, {PPOPP} 2012, New Orleans, LA, USA, February 25-29, 2012},
  pages     = {305--306},
  publisher = {{ACM}},
  year      = {2012},
  url       = {https://doi.org/10.1145/2145816.2145866},
  doi       = {10.1145/2145816.2145866},
  timestamp = {Sun, 12 Jun 2022 19:46:08 +0200},
  biburl    = {https://dblp.org/rec/conf/ppopp/HoeflerS12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper -- PPOPP 2012.
@inproceedings{DBLP:conf/ppopp/KjolstadHS12,
  author    = {Fredrik Kjolstad and Torsten Hoefler and Marc Snir},
  editor    = {J. Ramanujam and P. Sadayappan},
  title     = {Automatic datatype generation and optimization},
  booktitle = {Proceedings of the 17th {ACM} {SIGPLAN} Symposium on Principles and Practice of Parallel Programming, {PPOPP} 2012, New Orleans, LA, USA, February 25-29, 2012},
  pages     = {327--328},
  publisher = {{ACM}},
  year      = {2012},
  url       = {https://doi.org/10.1145/2145816.2145878},
  doi       = {10.1145/2145816.2145878},
  timestamp = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/ppopp/KjolstadHS12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper -- EuroMPI 2012 (LNCS 7490).
@inproceedings{DBLP:conf/pvm/PellegriniHF12,
  author    = {Simone Pellegrini and Torsten Hoefler and Thomas Fahringer},
  editor    = {Jesper Larsson Tr{\"{a}}ff and Siegfried Benkner and Jack J. Dongarra},
  title     = {Exact Dependence Analysis for Increased Communication Overlap},
  booktitle = {Recent Advances in the Message Passing Interface - 19th European {MPI} Users' Group Meeting, EuroMPI 2012, Vienna, Austria, September 23-26, 2012. Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {7490},
  pages     = {89--99},
  publisher = {Springer},
  year      = {2012},
  url       = {https://doi.org/10.1007/978-3-642-33518-1\_14},
  doi       = {10.1007/978-3-642-33518-1\_14},
  timestamp = {Sun, 25 Jul 2021 11:50:18 +0200},
  biburl    = {https://dblp.org/rec/conf/pvm/PellegriniHF12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper -- EuroMPI 2012 (LNCS 7490).
@inproceedings{DBLP:conf/pvm/SchneiderGH12,
  author    = {Timo Schneider and Robert Gerstenberger and Torsten Hoefler},
  editor    = {Jesper Larsson Tr{\"{a}}ff and Siegfried Benkner and Jack J. Dongarra},
  title     = {Micro-applications for Communication Data Access Patterns and {MPI} Datatypes},
  booktitle = {Recent Advances in the Message Passing Interface - 19th European {MPI} Users' Group Meeting, EuroMPI 2012, Vienna, Austria, September 23-26, 2012. Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {7490},
  pages     = {121--131},
  publisher = {Springer},
  year      = {2012},
  url       = {https://doi.org/10.1007/978-3-642-33518-1\_17},
  doi       = {10.1007/978-3-642-33518-1\_17},
  timestamp = {Fri, 19 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/pvm/SchneiderGH12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper -- EuroMPI 2012 (LNCS 7490).
% The acronym in "MPI's" is brace-protected so that bibliography styles which
% sentence-case titles cannot lowercase it.
@inproceedings{DBLP:conf/pvm/HoeflerDBBBBGKT12,
  author    = {Torsten Hoefler and James Dinan and Darius Buntinas and Pavan Balaji and Brian W. Barrett and Ron Brightwell and William Gropp and Vivek Kale and Rajeev Thakur},
  editor    = {Jesper Larsson Tr{\"{a}}ff and Siegfried Benkner and Jack J. Dongarra},
  title     = {Leveraging {MPI}'s One-Sided Communication Interface for Shared-Memory Programming},
  booktitle = {Recent Advances in the Message Passing Interface - 19th European {MPI} Users' Group Meeting, EuroMPI 2012, Vienna, Austria, September 23-26, 2012. Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {7490},
  pages     = {132--141},
  publisher = {Springer},
  year      = {2012},
  url       = {https://doi.org/10.1007/978-3-642-33518-1\_18},
  doi       = {10.1007/978-3-642-33518-1\_18},
  timestamp = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/pvm/HoeflerDBBBBGKT12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper -- SC '12.
@inproceedings{DBLP:conf/sc/HoeflerS12,
  author    = {Torsten Hoefler and Timo Schneider},
  editor    = {Jeffrey K. Hollingsworth},
  title     = {Optimization principles for collective neighborhood communications},
  booktitle = {{SC} Conference on High Performance Computing Networking, Storage and Analysis, {SC} '12, Salt Lake City, UT, {USA} - November 11 - 15, 2012},
  pages     = {98},
  publisher = {{IEEE/ACM}},
  year      = {2012},
  url       = {https://doi.org/10.1109/SC.2012.86},
  doi       = {10.1109/SC.2012.86},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/sc/HoeflerS12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Abstract in the 2012 SC Companion volume.
@inproceedings{DBLP:conf/sc/KaleGHSG12,
  author    = {Vivek Kale and Todd Gamblin and Torsten Hoefler and Bronis R. de Supinski and William D. Gropp},
  title     = {Abstract: Slack-Conscious Lightweight Loop Scheduling for Improving Scalability of Bulk-synchronous {MPI} Applications},
  booktitle = {2012 {SC} Companion: High Performance Computing, Networking Storage and Analysis, Salt Lake City, UT, USA, November 10-16, 2012},
  pages     = {1392},
  publisher = {{IEEE} Computer Society},
  year      = {2012},
  url       = {https://doi.org/10.1109/SC.Companion.2012.209},
  doi       = {10.1109/SC.COMPANION.2012.209},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/sc/KaleGHSG12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Edited proceedings volume -- ROSS '12 workshop.
@proceedings{DBLP:conf/ics/2012ross,
  editor    = {Torsten Hoefler and Kamil Iskra},
  title     = {Proceedings of the 2nd International Workshop on Runtime and Operating Systems for Supercomputers, {ROSS} '12, Venice, Italy, June 29, 2012},
  publisher = {{ACM}},
  year      = {2012},
  url       = {https://doi.org/10.1145/2318916},
  doi       = {10.1145/2318916},
  isbn      = {978-1-4503-1460-2},
  timestamp = {Wed, 12 Jan 2022 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/ics/2012ross.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article -- Concurr. Comput. Pract. Exp. 23(4), 2011.
@article{DBLP:journals/concurrency/HoeflerRRSTT11,
  author    = {Torsten Hoefler and Rolf Rabenseifner and Hubert Ritzdorf and Bronis R. de Supinski and Rajeev Thakur and Jesper Larsson Tr{\"{a}}ff},
  title     = {The scalable process topology interface of {MPI} 2.2},
  journal   = {Concurr. Comput. Pract. Exp.},
  volume    = {23},
  number    = {4},
  pages     = {293--310},
  year      = {2011},
  url       = {https://doi.org/10.1002/cpe.1643},
  doi       = {10.1002/CPE.1643},
  timestamp = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/concurrency/HoeflerRRSTT11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article -- Parallel Process. Lett. 21(1), 2011.
% Title casing repaired: the record carried "Mpi on millions of Cores". The
% acronym is now upper-case and brace-protected (as in the other MPI titles in
% this file) and the remaining words use consistent title case.
@article{DBLP:journals/ppl/BalajiBGGHKLTT11,
  author    = {Pavan Balaji and Darius Buntinas and David Goodell and William Gropp and Torsten Hoefler and Sameer Kumar and Ewing L. Lusk and Rajeev Thakur and Jesper Larsson Tr{\"{a}}ff},
  title     = {{MPI} on Millions of Cores},
  journal   = {Parallel Process. Lett.},
  volume    = {21},
  number    = {1},
  pages     = {45--60},
  year      = {2011},
  url       = {https://doi.org/10.1142/S0129626411000060},
  doi       = {10.1142/S0129626411000060},
  timestamp = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/ppl/BalajiBGGHKLTT11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper -- Euro-Par 2011, Part II (LNCS 6853).
@inproceedings{DBLP:conf/europar/SchneiderEHR11,
  author    = {Timo Schneider and Sven Eckelmann and Torsten Hoefler and Wolfgang Rehm},
  editor    = {Emmanuel Jeannot and Raymond Namyst and Jean Roman},
  title     = {Kernel-Based Offload of Collective Operations - Implementation, Evaluation and Lessons Learned},
  booktitle = {Euro-Par 2011 Parallel Processing - 17th International Conference, Euro-Par 2011, Bordeaux, France, August 29 - September 2, 2011, Proceedings, Part {II}},
  series    = {Lecture Notes in Computer Science},
  volume    = {6853},
  pages     = {264--275},
  publisher = {Springer},
  year      = {2011},
  url       = {https://doi.org/10.1007/978-3-642-23397-5\_26},
  doi       = {10.1007/978-3-642-23397-5\_26},
  timestamp = {Tue, 14 May 2019 10:00:46 +0200},
  biburl    = {https://dblp.org/rec/conf/europar/SchneiderEHR11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper -- 25th International Conference on Supercomputing, 2011.
@inproceedings{DBLP:conf/ics/HoeflerS11,
  author    = {Torsten Hoefler and Marc Snir},
  editor    = {David K. Lowenthal and Bronis R. de Supinski and Sally A. McKee},
  title     = {Generic topology mapping strategies for large-scale parallel architectures},
  booktitle = {Proceedings of the 25th International Conference on Supercomputing, 2011, Tucson, AZ, USA, May 31 - June 04, 2011},
  pages     = {75--84},
  publisher = {{ACM}},
  year      = {2011},
  url       = {https://doi.org/10.1145/1995896.1995909},
  doi       = {10.1145/1995896.1995909},
  timestamp = {Tue, 06 Nov 2018 11:07:03 +0100},
  biburl    = {https://dblp.org/rec/conf/ics/HoeflerS11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper -- 25th International Conference on Supercomputing, 2011.
@inproceedings{DBLP:conf/ics/WillcockHEL11,
  author    = {Jeremiah Willcock and Torsten Hoefler and Nicholas Gerard Edmonds and Andrew Lumsdaine},
  editor    = {David K. Lowenthal and Bronis R. de Supinski and Sally A. McKee},
  title     = {Active pebbles: parallel programming for data-driven applications},
  booktitle = {Proceedings of the 25th International Conference on Supercomputing, 2011, Tucson, AZ, USA, May 31 - June 04, 2011},
  pages     = {235--244},
  publisher = {{ACM}},
  year      = {2011},
  url       = {https://doi.org/10.1145/1995896.1995934},
  doi       = {10.1145/1995896.1995934},
  timestamp = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/ics/WillcockHEL11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper -- IPDPS 2011 (conference proceedings).
@inproceedings{DBLP:conf/ipps/DomkeHN11,
  author    = {Jens Domke and Torsten Hoefler and Wolfgang E. Nagel},
  title     = {Deadlock-Free Oblivious Routing for Arbitrary Topologies},
  booktitle = {25th {IEEE} International Symposium on Parallel and Distributed Processing, {IPDPS} 2011, Anchorage, Alaska, USA, 16-20 May, 2011 - Conference Proceedings},
  pages     = {616--627},
  publisher = {{IEEE}},
  year      = {2011},
  url       = {https://doi.org/10.1109/IPDPS.2011.65},
  doi       = {10.1109/IPDPS.2011.65},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/ipps/DomkeHN11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% HIPS introduction -- IPDPS 2011 (workshop proceedings).
@inproceedings{DBLP:conf/ipps/Hoefler11,
  author    = {Torsten Hoefler},
  title     = {{HIPS} Introduction},
  booktitle = {25th {IEEE} International Symposium on Parallel and Distributed Processing, {IPDPS} 2011, Anchorage, Alaska, USA, 16-20 May 2011 - Workshop Proceedings},
  pages     = {1139--1140},
  publisher = {{IEEE}},
  year      = {2011},
  url       = {https://doi.org/10.1109/IPDPS.2011.405},
  doi       = {10.1109/IPDPS.2011.405},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/ipps/Hoefler11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper -- PADL 2011 (LNCS 6539).
@inproceedings{DBLP:conf/padl/HolkBWHCL11,
  author    = {Eric Holk and William E. Byrd and Jeremiah Willcock and Torsten Hoefler and Arun Chauhan and Andrew Lumsdaine},
  editor    = {Ricardo Rocha and John Launchbury},
  title     = {Kanor - {A} Declarative Language for Explicit Communication},
  booktitle = {Practical Aspects of Declarative Languages - 13th International Symposium, {PADL} 2011, Austin, TX, USA, January 24-25, 2011. Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {6539},
  pages     = {190--204},
  publisher = {Springer},
  year      = {2011},
  url       = {https://doi.org/10.1007/978-3-642-18378-2\_16},
  doi       = {10.1007/978-3-642-18378-2\_16},
  timestamp = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/padl/HolkBWHCL11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper -- PPOPP 2011.
@inproceedings{DBLP:conf/ppopp/WillcockHEL11,
  author    = {Jeremiah Willcock and Torsten Hoefler and Nicholas Gerard Edmonds and Andrew Lumsdaine},
  editor    = {Calin Cascaval and Pen{-}Chung Yew},
  title     = {Active pebbles: a programming model for highly parallel fine-grained data-driven computations},
  booktitle = {Proceedings of the 16th {ACM} {SIGPLAN} Symposium on Principles and Practice of Parallel Programming, {PPOPP} 2011, San Antonio, TX, USA, February 12-16, 2011},
  pages     = {305--306},
  publisher = {{ACM}},
  year      = {2011},
  url       = {https://doi.org/10.1145/1941553.1941601},
  doi       = {10.1145/1941553.1941601},
  timestamp = {Sun, 12 Jun 2022 19:46:08 +0200},
  biburl    = {https://dblp.org/rec/conf/ppopp/WillcockHEL11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper -- EuroMPI 2011 (LNCS 6960).
@inproceedings{DBLP:conf/pvm/VenkatesanCGH11,
  author    = {Vishwanath Venkatesan and Mohamad Chaarawi and Edgar Gabriel and Torsten Hoefler},
  editor    = {Yiannis Cotronis and Anthony Danalis and Dimitrios S. Nikolopoulos and Jack J. Dongarra},
  title     = {Design and Evaluation of Nonblocking Collective {I/O} Operations},
  booktitle = {Recent Advances in the Message Passing Interface - 18th European {MPI} Users' Group Meeting, EuroMPI 2011, Santorini, Greece, September 18-21, 2011. Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {6960},
  pages     = {90--98},
  publisher = {Springer},
  year      = {2011},
  url       = {https://doi.org/10.1007/978-3-642-24449-0\_12},
  doi       = {10.1007/978-3-642-24449-0\_12},
  timestamp = {Tue, 14 May 2019 10:00:52 +0200},
  biburl    = {https://dblp.org/rec/conf/pvm/VenkatesanCGH11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper -- EuroMPI 2011 (LNCS 6960).
@inproceedings{DBLP:conf/pvm/GroppHTT11,
  author    = {William Gropp and Torsten Hoefler and Rajeev Thakur and Jesper Larsson Tr{\"{a}}ff},
  editor    = {Yiannis Cotronis and Anthony Danalis and Dimitrios S. Nikolopoulos and Jack J. Dongarra},
  title     = {Performance Expectations and Guidelines for {MPI} Derived Datatypes},
  booktitle = {Recent Advances in the Message Passing Interface - 18th European {MPI} Users' Group Meeting, EuroMPI 2011, Santorini, Greece, September 18-21, 2011. Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {6960},
  pages     = {150--159},
  publisher = {Springer},
  year      = {2011},
  url       = {https://doi.org/10.1007/978-3-642-24449-0\_18},
  doi       = {10.1007/978-3-642-24449-0\_18},
  timestamp = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/pvm/GroppHTT11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper -- EuroMPI 2011 (LNCS 6960).
@inproceedings{DBLP:conf/pvm/HoeflerS11,
  author    = {Torsten Hoefler and Marc Snir},
  editor    = {Yiannis Cotronis and Anthony Danalis and Dimitrios S. Nikolopoulos and Jack J. Dongarra},
  title     = {Writing Parallel Libraries with {MPI} - Common Practice, Issues, and Extensions},
  booktitle = {Recent Advances in the Message Passing Interface - 18th European {MPI} Users' Group Meeting, EuroMPI 2011, Santorini, Greece, September 18-21, 2011. Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {6960},
  pages     = {345--355},
  publisher = {Springer},
  year      = {2011},
  url       = {https://doi.org/10.1007/978-3-642-24449-0\_45},
  doi       = {10.1007/978-3-642-24449-0\_45},
  timestamp = {Fri, 19 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/pvm/HoeflerS11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper -- SC 2011, State of the Practice Reports.
@inproceedings{DBLP:conf/sc/HoeflerGKS11,
  author    = {Torsten Hoefler and William Gropp and William Kramer and Marc Snir},
  editor    = {Scott A. Lathrop and Jim Costa and William Kramer},
  title     = {Performance modeling for systematic performance tuning},
  booktitle = {Conference on High Performance Computing Networking, Storage and Analysis - State of the Practice Reports, {SC} 2011, Seattle, Washington, USA, November 12-18, 2011},
  pages     = {6:1--6:12},
  publisher = {{ACM}},
  year      = {2011},
  url       = {https://doi.org/10.1145/2063348.2063356},
  doi       = {10.1145/2063348.2063356},
  timestamp = {Fri, 03 Jul 2020 08:57:23 +0200},
  biburl    = {https://dblp.org/rec/conf/sc/HoeflerGKS11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper -- TeraGrid Conference, TG '11.
@inproceedings{DBLP:conf/tg/HarrellSSHLO11,
  author    = {Stephen Lien Harrell and Preston M. Smith and Doug Smith and Torsten Hoefler and Anna A. Labutina and Trinity Overmyer},
  editor    = {John Towns and Shawn Brown and Daniel S. Katz},
  title     = {Methods of creating student cluster competition teams},
  booktitle = {Proceedings of the 2011 TeraGrid Conference - Extreme Digital Discovery, {TG} '11, Salt Lake City, Utah, USA, July 18-21, 2011},
  pages     = {50:1--50:6},
  publisher = {{ACM}},
  year      = {2011},
  url       = {https://doi.org/10.1145/2016741.2016795},
  doi       = {10.1145/2016741.2016795},
  timestamp = {Sat, 09 Apr 2022 12:46:56 +0200},
  biburl    = {https://dblp.org/rec/conf/tg/HarrellSSHLO11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article -- Comput. Sci. Eng. 12(6), 2010.
@article{DBLP:journals/cse/Hoefler10,
  author    = {Torsten Hoefler},
  title     = {Software and Hardware Techniques for Power-Efficient {HPC} Networking},
  journal   = {Comput. Sci. Eng.},
  volume    = {12},
  number    = {6},
  pages     = {30--37},
  year      = {2010},
  url       = {https://doi.org/10.1109/MCSE.2010.96},
  doi       = {10.1109/MCSE.2010.96},
  timestamp = {Tue, 16 Aug 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/cse/Hoefler10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article -- Int. J. Parallel Emergent Distributed Syst. 25(4), 2010.
@article{DBLP:journals/paapp/HoeflerSL10,
  author    = {Torsten Hoefler and Timo Schneider and Andrew Lumsdaine},
  title     = {Accurately measuring overhead, communication time and progression of blocking and nonblocking collective operations at massive scale},
  journal   = {Int. J. Parallel Emergent Distributed Syst.},
  volume    = {25},
  number    = {4},
  pages     = {241--258},
  year      = {2010},
  url       = {https://doi.org/10.1080/17445760902894688},
  doi       = {10.1080/17445760902894688},
  timestamp = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/paapp/HoeflerSL10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper -- PACT 2010.
@inproceedings{DBLP:conf/IEEEpact/WillcockHEL10,
  author    = {Jeremiah Willcock and Torsten Hoefler and Nicholas Gerard Edmonds and Andrew Lumsdaine},
  editor    = {Valentina Salapura and Michael Gschwind and Jens Knoop},
  title     = {{AM++:} a generalized active message framework},
  booktitle = {19th International Conference on Parallel Architectures and Compilation Techniques, {PACT} 2010, Vienna, Austria, September 11-15, 2010},
  pages     = {401--410},
  publisher = {{ACM}},
  year      = {2010},
  url       = {https://doi.org/10.1145/1854273.1854323},
  doi       = {10.1145/1854273.1854323},
  timestamp = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/IEEEpact/WillcockHEL10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Workshop paper -- Euro-Par 2010 Parallel Processing Workshops (LNCS 6586).
% Editor "Di Martino, Beniamino" is given in comma form: written as
% "Beniamino Di Martino", BibTeX takes only "Martino" as the surname because
% the capitalised "Di" is not recognised as a name particle.
% NOTE(review): assumes "Di Martino" is the full family name -- confirm.
@inproceedings{DBLP:conf/europar/Hoefler10,
  author    = {Torsten Hoefler},
  editor    = {Mario R. Guarracino and Fr{\'{e}}d{\'{e}}ric Vivien and Jesper Larsson Tr{\"{a}}ff and Mario Cannataro and Marco Danelutto and Anders Hast and Francesca Perla and Andreas Kn{\"{u}}pfer and Di Martino, Beniamino and Michael Alexander},
  title     = {Bridging Performance Analysis Tools and Analytic Performance Modeling for {HPC}},
  booktitle = {Euro-Par 2010 Parallel Processing Workshops - HeteroPar, HPCC, HiBB, CoreGrid, UCHPC, HPCF, PROPER, CCPI, VHPC, Ischia, Italy, August 31-September 3, 2010, Revised Selected Papers},
  series    = {Lecture Notes in Computer Science},
  volume    = {6586},
  pages     = {483--491},
  publisher = {Springer},
  year      = {2010},
  url       = {https://doi.org/10.1007/978-3-642-21878-1\_60},
  doi       = {10.1007/978-3-642-21878-1\_60},
  timestamp = {Wed, 19 Feb 2020 14:52:57 +0100},
  biburl    = {https://dblp.org/rec/conf/europar/Hoefler10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper -- HiPC 2010.
@inproceedings{DBLP:conf/hipc/EdmondsHL10,
  author    = {Nick Edmonds and Torsten Hoefler and Andrew Lumsdaine},
  title     = {A space-efficient parallel algorithm for computing betweenness centrality in distributed memory},
  booktitle = {2010 International Conference on High Performance Computing, HiPC 2010, Dona Paula, Goa, India, December 19-22, 2010},
  pages     = {1--10},
  publisher = {{IEEE} Computer Society},
  year      = {2010},
  url       = {https://doi.org/10.1109/HIPC.2010.5713180},
  doi       = {10.1109/HIPC.2010.5713180},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/hipc/EdmondsHL10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper -- HOTI 2010.
@inproceedings{DBLP:conf/hoti/ArimilliACCDDHJLLNR10,
  author    = {L. Baba Arimilli and Ravi Arimilli and Vicente Chung and Scott Clark and Wolfgang E. Denzel and Ben C. Drerup and Torsten Hoefler and Jody B. Joyner and Jerry Lewis and Jian Li and Nan Ni and Ramakrishnan Rajamony},
  editor    = {Fabrizio Petrini and Dennis Abts and Ron Brightwell and Pavan Balaji and Cyriel Minkenberg},
  title     = {The {PERCS} High-Performance Interconnect},
  booktitle = {{IEEE} 18th Annual Symposium on High Performance Interconnects, {HOTI} 2010, Google Campus, Mountain View, California, USA, August 18-20, 2010},
  pages     = {75--82},
  publisher = {{IEEE} Computer Society},
  year      = {2010},
  url       = {https://doi.org/10.1109/HOTI.2010.16},
  doi       = {10.1109/HOTI.2010.16},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/hoti/ArimilliACCDDHJLLNR10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper -- HPDC 2010.
% The mixed-case names "LogGOPSim" and "LogGOPS" are brace-protected so that
% bibliography styles which sentence-case titles keep their capitalisation.
@inproceedings{DBLP:conf/hpdc/HoeflerSL10,
  author    = {Torsten Hoefler and Timo Schneider and Andrew Lumsdaine},
  editor    = {Salim Hariri and Kate Keahey},
  title     = {{LogGOPSim}: simulating large-scale applications in the {LogGOPS} model},
  booktitle = {Proceedings of the 19th {ACM} International Symposium on High Performance Distributed Computing, {HPDC} 2010, Chicago, Illinois, USA, June 21-25, 2010},
  pages     = {597--604},
  publisher = {{ACM}},
  year      = {2010},
  url       = {https://doi.org/10.1145/1851476.1851564},
  doi       = {10.1145/1851476.1851564},
  timestamp = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/hpdc/HoeflerSL10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper -- PPOPP 2010.
@inproceedings{DBLP:conf/ppopp/HoeflerSL10,
  author    = {Torsten Hoefler and Christian Siebert and Andrew Lumsdaine},
  editor    = {R. Govindarajan and David A. Padua and Mary W. Hall},
  title     = {Scalable communication protocols for dynamic sparse data exchange},
  booktitle = {Proceedings of the 15th {ACM} {SIGPLAN} Symposium on Principles and Practice of Parallel Programming, {PPOPP} 2010, Bangalore, India, January 9-14, 2010},
  pages     = {159--168},
  publisher = {{ACM}},
  year      = {2010},
  url       = {https://doi.org/10.1145/1693453.1693476},
  doi       = {10.1145/1693453.1693476},
  timestamp = {Sun, 12 Jun 2022 19:46:08 +0200},
  biburl    = {https://dblp.org/rec/conf/ppopp/HoeflerSL10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper -- EuroMPI 2010 (LNCS 6305).
@inproceedings{DBLP:conf/pvm/HoeflerGTT10,
  author    = {Torsten Hoefler and William Gropp and Rajeev Thakur and Jesper Larsson Tr{\"{a}}ff},
  editor    = {Rainer Keller and Edgar Gabriel and Michael M. Resch and Jack J. Dongarra},
  title     = {Toward Performance Models of {MPI} Implementations for Understanding Application Scaling Issues},
  booktitle = {Recent Advances in the Message Passing Interface - 17th European {MPI} Users' Group Meeting, EuroMPI 2010, Stuttgart, Germany, September 12-15, 2010. Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {6305},
  pages     = {21--30},
  publisher = {Springer},
  year      = {2010},
  url       = {https://doi.org/10.1007/978-3-642-15646-5\_3},
  doi       = {10.1007/978-3-642-15646-5\_3},
  timestamp = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/pvm/HoeflerGTT10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper -- EuroMPI 2010 (LNCS 6305).
@inproceedings{DBLP:conf/pvm/HoeflerBBSL10,
  author    = {Torsten Hoefler and Greg Bronevetsky and Brian Barrett and Bronis R. de Supinski and Andrew Lumsdaine},
  editor    = {Rainer Keller and Edgar Gabriel and Michael M. Resch and Jack J. Dongarra},
  title     = {Efficient {MPI} Support for Advanced Hybrid Programming Models},
  booktitle = {Recent Advances in the Message Passing Interface - 17th European {MPI} Users' Group Meeting, EuroMPI 2010, Stuttgart, Germany, September 12-15, 2010. Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {6305},
  pages     = {50--61},
  publisher = {Springer},
  year      = {2010},
  url       = {https://doi.org/10.1007/978-3-642-15646-5\_6},
  doi       = {10.1007/978-3-642-15646-5\_6},
  timestamp = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/pvm/HoeflerBBSL10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper -- EuroMPI 2010 (LNCS 6305).
% The proper noun "Fourier" is brace-protected so that bibliography styles
% which sentence-case titles keep its capital letter.
@inproceedings{DBLP:conf/pvm/HoeflerG10,
  author    = {Torsten Hoefler and Steven Gottlieb},
  editor    = {Rainer Keller and Edgar Gabriel and Michael M. Resch and Jack J. Dongarra},
  title     = {Parallel Zero-Copy Algorithms for Fast {Fourier} Transform and Conjugate Gradient Using {MPI} Datatypes},
  booktitle = {Recent Advances in the Message Passing Interface - 17th European {MPI} Users' Group Meeting, EuroMPI 2010, Stuttgart, Germany, September 12-15, 2010. Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {6305},
  pages     = {132--141},
  publisher = {Springer},
  year      = {2010},
  url       = {https://doi.org/10.1007/978-3-642-15646-5\_14},
  doi       = {10.1007/978-3-642-15646-5\_14},
  timestamp = {Fri, 19 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/pvm/HoeflerG10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper -- SC 2010.
@inproceedings{DBLP:conf/sc/HoeflerSL10,
  author    = {Torsten Hoefler and Timo Schneider and Andrew Lumsdaine},
  title     = {Characterizing the Influence of System Noise on Large-Scale Applications by Simulation},
  booktitle = {Conference on High Performance Computing Networking, Storage and Analysis, {SC} 2010, New Orleans, LA, USA, November 13-19, 2010},
  pages     = {1--11},
  publisher = {{IEEE}},
  year      = {2010},
  url       = {https://doi.org/10.1109/SC.2010.12},
  doi       = {10.1109/SC.2010.12},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/sc/HoeflerSL10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article -- Parallel Process. Lett. 19(4), 2009.
@article{DBLP:journals/ppl/HoeflerSL09,
  author    = {Torsten Hoefler and Timo Schneider and Andrew Lumsdaine},
  title     = {The Effect of Network Noise on Large-Scale Collective Communications},
  journal   = {Parallel Process. Lett.},
  volume    = {19},
  number    = {4},
  pages     = {573--593},
  year      = {2009},
  url       = {https://doi.org/10.1142/S0129626409000420},
  doi       = {10.1142/S0129626409000420},
  timestamp = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/ppl/HoeflerSL09.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article -- Simul. Model. Pract. Theory 17(9), 2009.
% The mixed-case model name "LogGP" is brace-protected so that bibliography
% styles which sentence-case titles keep its capitalisation.
@article{DBLP:journals/simpra/HoeflerSL09,
  author    = {Torsten Hoefler and Timo Schneider and Andrew Lumsdaine},
  title     = {{LogGP} in theory and practice - An in-depth analysis of modern interconnection networks and benchmarking methods for collective operations},
  journal   = {Simul. Model. Pract. Theory},
  volume    = {17},
  number    = {9},
  pages     = {1511--1521},
  year      = {2009},
  url       = {https://doi.org/10.1016/j.simpat.2009.06.007},
  doi       = {10.1016/J.SIMPAT.2009.06.007},
  timestamp = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/simpra/HoeflerSL09.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper -- HiPC 2009.
@inproceedings{DBLP:conf/hipc/KambadurGHL09,
  author    = {Prabhanjan Kambadur and Anshul Gupta and Torsten Hoefler and Andrew Lumsdaine},
  editor    = {Yuanyuan Yang and Manish Parashar and Rajeev Muralidhar and Viktor K. Prasanna},
  title     = {Demand-driven execution of static directed acyclic graphs using task parallelism},
  booktitle = {16th International Conference on High Performance Computing, HiPC 2009, December 16-19, 2009, Kochi, India, Proceedings},
  pages     = {284--293},
  publisher = {{IEEE} Computer Society},
  year      = {2009},
  url       = {https://doi.org/10.1109/HIPC.2009.5433201},
  doi       = {10.1109/HIPC.2009.5433201},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/hipc/KambadurGHL09.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper -- HOTI 2009.
% The mixed-case name "InfiniBand" is brace-protected so that bibliography
% styles which sentence-case titles keep its capitalisation.
@inproceedings{DBLP:conf/hoti/HoeflerSL09,
  author    = {Torsten Hoefler and Timo Schneider and Andrew Lumsdaine},
  editor    = {Keren Bergman and Ron Brightwell and Fabrizio Petrini and Head Bubba},
  title     = {Optimized Routing for Large-Scale {InfiniBand} Networks},
  booktitle = {17th {IEEE} Symposium on High Performance Interconnects, {HOTI} 2009, New York, New York, USA, August 25-27, 2009},
  pages     = {103--111},
  publisher = {{IEEE} Computer Society},
  year      = {2009},
  url       = {https://doi.org/10.1109/HOTI.2009.9},
  doi       = {10.1109/HOTI.2009.9},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/hoti/HoeflerSL09.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper -- ICPP 2009.
@inproceedings{DBLP:conf/icpp/HoeflerSL09,
  author    = {Torsten Hoefler and Christian Siebert and Andrew Lumsdaine},
  title     = {Group Operation Assembly Language - {A} Flexible Way to Express Collective Communication},
  booktitle = {{ICPP} 2009, International Conference on Parallel Processing, Vienna, Austria, 22-25 September 2009},
  pages     = {574--581},
  publisher = {{IEEE} Computer Society},
  year      = {2009},
  url       = {https://doi.org/10.1109/ICPP.2009.70},
  doi       = {10.1109/ICPP.2009.70},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icpp/HoeflerSL09.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper -- IPDPS 2009.
@inproceedings{DBLP:conf/ipps/HoeflerSL09,
  author    = {Torsten Hoefler and Timo Schneider and Andrew Lumsdaine},
  title     = {A power-aware, application-based performance study of modern commodity cluster interconnection networks},
  booktitle = {23rd {IEEE} International Symposium on Parallel and Distributed Processing, {IPDPS} 2009, Rome, Italy, May 23-29, 2009},
  pages     = {1--7},
  publisher = {{IEEE}},
  year      = {2009},
  url       = {https://doi.org/10.1109/IPDPS.2009.5160891},
  doi       = {10.1109/IPDPS.2009.5160891},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/ipps/HoeflerSL09.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ipps/HoeflerSL09a,
  author    = {Torsten Hoefler and Timo Schneider and Andrew Lumsdaine},
  title     = {The impact of network noise at large-scale communication performance},
  booktitle = {23rd {IEEE} International Symposium on Parallel and Distributed Processing, {IPDPS} 2009, Rome, Italy, May 23-29, 2009},
  pages     = {1--8},
  publisher = {{IEEE}},
  year      = {2009},
  url       = {https://doi.org/10.1109/IPDPS.2009.5161095},
  doi       = {10.1109/IPDPS.2009.5161095},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/ipps/HoeflerSL09a.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/ipps/HoeflerT09,
  author    = {Torsten Hoefler and Jesper Larsson Tr{\"{a}}ff},
  title     = {Sparse collective operations for {MPI}},
  booktitle = {23rd {IEEE} International Symposium on Parallel and Distributed Processing, {IPDPS} 2009, Rome, Italy, May 23-29, 2009},
  pages     = {1--8},
  publisher = {{IEEE}},
  year      = {2009},
  url       = {https://doi.org/10.1109/IPDPS.2009.5160935},
  doi       = {10.1109/IPDPS.2009.5160935},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/ipps/HoeflerT09.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/ipps/KaiserHBB09,
  author    = {Christian Kaiser and Torsten Hoefler and Boris Bierbaum and Thomas Bemmerl},
  title     = {Implementation and analysis of nonblocking collective operations on {SCI} networks},
  booktitle = {23rd {IEEE} International Symposium on Parallel and Distributed Processing, {IPDPS} 2009, Rome, Italy, May 23-29, 2009},
  pages     = {1--7},
  publisher = {{IEEE}},
  year      = {2009},
  url       = {https://doi.org/10.1109/IPDPS.2009.5160892},
  doi       = {10.1109/IPDPS.2009.5160892},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/ipps/KaiserHBB09.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% {MapReduce} is brace-protected so sentence-casing styles keep its camel-case spelling.
@inproceedings{DBLP:conf/pvm/HoeflerLD09,
  author    = {Torsten Hoefler and Andrew Lumsdaine and Jack J. Dongarra},
  editor    = {Matti Ropo and Jan Westerholm and Jack J. Dongarra},
  title     = {Towards Efficient {MapReduce} Using {MPI}},
  booktitle = {Recent Advances in Parallel Virtual Machine and Message Passing Interface, 16th European {PVM/MPI} Users' Group Meeting, Espoo, Finland, September 7-10, 2009. Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {5759},
  pages     = {240--249},
  publisher = {Springer},
  year      = {2009},
  url       = {https://doi.org/10.1007/978-3-642-03770-2\_30},
  doi       = {10.1007/978-3-642-03770-2\_30},
  timestamp = {Tue, 14 May 2019 10:00:52 +0200},
  biburl    = {https://dblp.org/rec/conf/pvm/HoeflerLD09.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% {Cell} is a processor name; it is brace-protected so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/arcs/SchneiderHWMR08,
  author    = {Timo Schneider and Torsten Hoefler and Simon Wunderlich and Torsten Mehlan and Wolfgang Rehm},
  editor    = {Wolfgang E. Nagel and Rolf Hoffmann and Andreas Koch},
  title     = {An Optimized {ZGEMM} Implementation for the {Cell} {BE}},
  booktitle = {9th Workshop on Parallel Systems and Algorithms {(PASA)} held at the 21st Conference on the Architecture of Computing Systems (ARCS), February 26th, 2008, in Dresden, Germany},
  series    = {{LNI}},
  volume    = {{P-124}},
  pages     = {113--122},
  publisher = {{GI}},
  year      = {2008},
  url       = {https://dl.gi.de/handle/20.500.12116/22270},
  timestamp = {Tue, 04 Jul 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/arcs/SchneiderHWMR08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/ccgrid/HoeflerL08,
  author    = {Torsten Hoefler and Andrew Lumsdaine},
  title     = {Overlapping Communication and Computation with High Level Communication Routines},
  booktitle = {8th {IEEE} International Symposium on Cluster Computing and the Grid (CCGrid 2008), 19-22 May 2008, Lyon, France},
  pages     = {572--577},
  publisher = {{IEEE} Computer Society},
  year      = {2008},
  url       = {https://doi.org/10.1109/CCGRID.2008.15},
  doi       = {10.1109/CCGRID.2008.15},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/ccgrid/HoeflerL08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/cluster/HoeflerSL08,
  author    = {Torsten Hoefler and Timo Schneider and Andrew Lumsdaine},
  title     = {Multistage switches are not crossbars: Effects of static routing in high-performance networks},
  booktitle = {Proceedings of the 2008 {IEEE} International Conference on Cluster Computing, 29 September - 1 October 2008, Tsukuba, Japan},
  pages     = {116--125},
  publisher = {{IEEE} Computer Society},
  year      = {2008},
  url       = {https://doi.org/10.1109/CLUSTR.2008.4663762},
  doi       = {10.1109/CLUSTR.2008.4663762},
  timestamp = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/cluster/HoeflerSL08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/cluster/HoeflerL08,
  author    = {Torsten Hoefler and Andrew Lumsdaine},
  title     = {Message progression in parallel computing - to thread or not to thread?},
  booktitle = {Proceedings of the 2008 {IEEE} International Conference on Cluster Computing, 29 September - 1 October 2008, Tsukuba, Japan},
  pages     = {213--222},
  publisher = {{IEEE} Computer Society},
  year      = {2008},
  url       = {https://doi.org/10.1109/CLUSTR.2008.4663774},
  doi       = {10.1109/CLUSTR.2008.4663774},
  timestamp = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/cluster/HoeflerL08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/hoti/GeoffrayH08,
  author    = {Patrick Geoffray and Torsten Hoefler},
  title     = {Adaptive Routing Strategies for Modern High Performance Networks},
  booktitle = {16th Annual {IEEE} Symposium on High Performance Interconnects {(HOTI} 2008), 26-28 August 2008, Stanford, CA, {USA}},
  pages     = {165--172},
  publisher = {{IEEE} Computer Society},
  year      = {2008},
  url       = {https://doi.org/10.1109/HOTI.2008.21},
  doi       = {10.1109/HOTI.2008.21},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/hoti/GeoffrayH08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% {InfiniBand} is a trademark; it is spelled with its proper capitals and brace-protected against recasing.
@inproceedings{DBLP:conf/ipps/HoeflerL08,
  author    = {Torsten Hoefler and Andrew Lumsdaine},
  title     = {Optimizing non-blocking collective operations for {InfiniBand}},
  booktitle = {22nd {IEEE} International Symposium on Parallel and Distributed Processing, {IPDPS} 2008, Miami, Florida USA, April 14-18, 2008},
  pages     = {1--8},
  publisher = {{IEEE}},
  year      = {2008},
  url       = {https://doi.org/10.1109/IPDPS.2008.4536138},
  doi       = {10.1109/IPDPS.2008.4536138},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/ipps/HoeflerL08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/ipps/HoeflerSL08,
  author    = {Torsten Hoefler and Timo Schneider and Andrew Lumsdaine},
  title     = {Accurately measuring collective operations at massive scale},
  booktitle = {22nd {IEEE} International Symposium on Parallel and Distributed Processing, {IPDPS} 2008, Miami, Florida USA, April 14-18, 2008},
  pages     = {1--8},
  publisher = {{IEEE}},
  year      = {2008},
  url       = {https://doi.org/10.1109/IPDPS.2008.4536494},
  doi       = {10.1109/IPDPS.2008.4536494},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/ipps/HoeflerSL08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/pvm/HoeflerLL08,
  author    = {Torsten Hoefler and Florian Lorenzen and Andrew Lumsdaine},
  editor    = {Alexey L. Lastovetsky and M. Tahar Kechadi and Jack J. Dongarra},
  title     = {Sparse Non-blocking Collectives in Quantum Mechanical Calculations},
  booktitle = {Recent Advances in Parallel Virtual Machine and Message Passing Interface, 15th European {PVM/MPI} Users' Group Meeting, Dublin, Ireland, September 7-10, 2008. Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {5205},
  pages     = {55--63},
  publisher = {Springer},
  year      = {2008},
  url       = {https://doi.org/10.1007/978-3-540-87475-1\_13},
  doi       = {10.1007/978-3-540-87475-1\_13},
  timestamp = {Mon, 03 Jan 2022 22:32:15 +0100},
  biburl    = {https://dblp.org/rec/conf/pvm/HoeflerLL08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/pvm/HoeflerSGL08,
  author    = {Torsten Hoefler and Maraike Schellmann and Sergei Gorlatch and Andrew Lumsdaine},
  editor    = {Alexey L. Lastovetsky and M. Tahar Kechadi and Jack J. Dongarra},
  title     = {Communication Optimization for Medical Image Reconstruction Algorithms},
  booktitle = {Recent Advances in Parallel Virtual Machine and Message Passing Interface, 15th European {PVM/MPI} Users' Group Meeting, Dublin, Ireland, September 7-10, 2008. Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {5205},
  pages     = {75--83},
  publisher = {Springer},
  year      = {2008},
  url       = {https://doi.org/10.1007/978-3-540-87475-1\_15},
  doi       = {10.1007/978-3-540-87475-1\_15},
  timestamp = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/pvm/HoeflerSGL08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% The editor surname "Meyer auf der Heide" is braced as one unit; unbraced, BibTeX would
% treat "Meyer" as a given name and "auf der" as a von-particle.
@inproceedings{DBLP:conf/spaa/HoeflerGL08,
  author    = {Torsten Hoefler and Peter Gottschling and Andrew Lumsdaine},
  editor    = {{Meyer auf der Heide}, Friedhelm and Shavit, Nir},
  title     = {Leveraging non-blocking collective communication in high-performance applications},
  booktitle = {{SPAA} 2008: Proceedings of the 20th Annual {ACM} Symposium on Parallelism in Algorithms and Architectures, Munich, Germany, June 14-16, 2008},
  pages     = {113--115},
  publisher = {{ACM}},
  year      = {2008},
  url       = {https://doi.org/10.1145/1378533.1378554},
  doi       = {10.1145/1378533.1378554},
  timestamp = {Wed, 21 Nov 2018 11:14:43 +0100},
  biburl    = {https://dblp.org/rec/conf/spaa/HoeflerGL08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/pc/HoeflerGLR07,
  author    = {Torsten Hoefler and Peter Gottschling and Andrew Lumsdaine and Wolfgang Rehm},
  title     = {Optimizing a conjugate gradient solver with non-blocking collective operations},
  journal   = {Parallel Comput.},
  volume    = {33},
  number    = {9},
  pages     = {624--633},
  year      = {2007},
  url       = {https://doi.org/10.1016/j.parco.2007.06.006},
  doi       = {10.1016/J.PARCO.2007.06.006},
  timestamp = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/pc/HoeflerGLR07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/hpcc/HoeflerMLR07,
  author    = {Torsten Hoefler and Torsten Mehlan and Andrew Lumsdaine and Wolfgang Rehm},
  editor    = {Ronald H. Perrott and Barbara M. Chapman and Jaspal Subhlok and Rodrigo Fernandes de Mello and Laurence Tianruo Yang},
  title     = {Netgauge: {A} Network Performance Measurement Framework},
  booktitle = {High Performance Computing and Communications, Third International Conference, {HPCC} 2007, Houston, USA, September 26-28, 2007, Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {4782},
  pages     = {659--671},
  publisher = {Springer},
  year      = {2007},
  url       = {https://doi.org/10.1007/978-3-540-75444-2\_62},
  doi       = {10.1007/978-3-540-75444-2\_62},
  timestamp = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/hpcc/HoeflerMLR07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% {LogGP} is a model name; it is brace-protected so sentence-casing styles keep its capitals.
@inproceedings{DBLP:conf/ipps/HoeflerLR07,
  author    = {Torsten Hoefler and Andre Lichei and Wolfgang Rehm},
  title     = {Low-Overhead {LogGP} Parameter Assessment for Modern Interconnection Networks},
  booktitle = {21st International Parallel and Distributed Processing Symposium {(IPDPS} 2007), Proceedings, 26-30 March 2007, Long Beach, California, {USA}},
  pages     = {1--8},
  publisher = {{IEEE}},
  year      = {2007},
  url       = {https://doi.org/10.1109/IPDPS.2007.370593},
  doi       = {10.1109/IPDPS.2007.370593},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/ipps/HoeflerLR07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% {InfiniBand} is brace-protected so sentence-casing styles keep its capitalisation.
@inproceedings{DBLP:conf/ipps/HoeflerSR07,
  author    = {Torsten Hoefler and Christian Siebert and Wolfgang Rehm},
  title     = {A practically constant-time {MPI} Broadcast Algorithm for large-scale {InfiniBand} Clusters with Multicast},
  booktitle = {21st International Parallel and Distributed Processing Symposium {(IPDPS} 2007), Proceedings, 26-30 March 2007, Long Beach, California, {USA}},
  pages     = {1--8},
  publisher = {{IEEE}},
  year      = {2007},
  url       = {https://doi.org/10.1109/IPDPS.2007.370475},
  doi       = {10.1109/IPDPS.2007.370475},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/ipps/HoeflerSR07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/pvm/HoeflerKGSL07,
  author    = {Torsten Hoefler and Prabhanjan Kambadur and Richard L. Graham and Galen M. Shipman and Andrew Lumsdaine},
  editor    = {Franck Cappello and Thomas H{\'{e}}rault and Jack J. Dongarra},
  title     = {A Case for Standard Non-blocking Collective Operations},
  booktitle = {Recent Advances in Parallel Virtual Machine and Message Passing Interface, 14th European {PVM/MPI} User's Group Meeting, Paris, France, September 30 - October 3, 2007, Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {4757},
  pages     = {125--134},
  publisher = {Springer},
  year      = {2007},
  url       = {https://doi.org/10.1007/978-3-540-75416-9\_22},
  doi       = {10.1007/978-3-540-75416-9\_22},
  timestamp = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/pvm/HoeflerKGSL07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/sc/HoeflerLR07,
  author    = {Torsten Hoefler and Andrew Lumsdaine and Wolfgang Rehm},
  editor    = {Becky Verastegui},
  title     = {Implementation and performance analysis of non-blocking collective operations for {MPI}},
  booktitle = {Proceedings of the {ACM/IEEE} Conference on High Performance Networking and Computing, {SC} 2007, November 10-16, 2007, Reno, Nevada, {USA}},
  pages     = {52},
  publisher = {{ACM} Press},
  year      = {2007},
  url       = {https://doi.org/10.1145/1362622.1362692},
  doi       = {10.1145/1362622.1362692},
  timestamp = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/sc/HoeflerLR07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/arcs/HoeflerMMR06,
  author    = {Torsten Hoefler and Torsten Mehlan and Frank Mietke and Wolfgang Rehm},
  editor    = {Wolfgang Karl and J{\"{u}}rgen Becker and Karl{-}Erwin Gro{\ss}pietsch and Christian Hochberger and Erik Maehle},
  title     = {Adding Low-Cost Hardware Barrier Support to Small Commodity Clusters},
  booktitle = {{ARCS} 2006 - 19th International Conference on Architecture of Computing Systems, Workshops Proceedings, March 16, 2006, Frankfurt am Main, Germany},
  series    = {{LNI}},
  volume    = {{P-81}},
  pages     = {343--350},
  publisher = {{GI}},
  year      = {2006},
  url       = {https://dl.gi.de/handle/20.500.12116/29432},
  timestamp = {Tue, 04 Jul 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/arcs/HoeflerMMR06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% {Mellanox} and {InfiniBand} are brace-protected so sentence-casing styles keep their capitalisation.
@inproceedings{DBLP:conf/europar/MietkeRBMHR06,
  author    = {Frank Mietke and Robert Rex and Robert Baumgartl and Torsten Mehlan and Torsten Hoefler and Wolfgang Rehm},
  editor    = {Wolfgang E. Nagel and Wolfgang V. Walter and Wolfgang Lehner},
  title     = {Analysis of the Memory Registration Process in the {Mellanox} {InfiniBand} Software Stack},
  booktitle = {Euro-Par 2006, Parallel Processing, 12th International Euro-Par Conference, Dresden, Germany, August 28 - September 1, 2006, Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {4128},
  pages     = {124--133},
  publisher = {Springer},
  year      = {2006},
  url       = {https://doi.org/10.1007/11823285\_13},
  doi       = {10.1007/11823285\_13},
  timestamp = {Tue, 14 May 2019 10:00:46 +0200},
  biburl    = {https://dblp.org/rec/conf/europar/MietkeRBMHR06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% {InfiniBand} is brace-protected so sentence-casing styles keep its capitalisation.
@inproceedings{DBLP:conf/ipps/HoeflerMMR06,
  author    = {Torsten Hoefler and Torsten Mehlan and Frank Mietke and Wolfgang Rehm},
  title     = {Fast barrier synchronization for {InfiniBand}{\texttrademark}},
  booktitle = {20th International Parallel and Distributed Processing Symposium {(IPDPS} 2006), Proceedings, 25-29 April 2006, Rhodes Island, Greece},
  publisher = {{IEEE}},
  year      = {2006},
  url       = {https://doi.org/10.1109/IPDPS.2006.1639561},
  doi       = {10.1109/IPDPS.2006.1639561},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/ipps/HoeflerMMR06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% {LogfP} and {InfiniBand} are brace-protected; a sentence-casing style would otherwise
% lowercase everything after the first letter of the title.
@inproceedings{DBLP:conf/ipps/HoeflerMMR06a,
  author    = {Torsten Hoefler and Torsten Mehlan and Frank Mietke and Wolfgang Rehm},
  title     = {{LogfP} - a model for small messages in {InfiniBand}},
  booktitle = {20th International Parallel and Distributed Processing Symposium {(IPDPS} 2006), Proceedings, 25-29 April 2006, Rhodes Island, Greece},
  publisher = {{IEEE}},
  year      = {2006},
  url       = {https://doi.org/10.1109/IPDPS.2006.1639624},
  doi       = {10.1109/IPDPS.2006.1639624},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/ipps/HoeflerMMR06a.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Editor "Di Martino, Beniamino" uses comma form so the two-word surname is not split
% into a given name "Di" and a surname "Martino".
@inproceedings{DBLP:conf/ispa/HoeflerSRL06,
  author    = {Torsten Hoefler and Jeffrey M. Squyres and Wolfgang Rehm and Andrew Lumsdaine},
  editor    = {Geyong Min and Di Martino, Beniamino and Laurence Tianruo Yang and Minyi Guo and Gudula R{\"{u}}nger},
  title     = {A Case for Non-blocking Collective Operations},
  booktitle = {Frontiers of High Performance Computing and Networking - {ISPA} 2006 Workshops, {ISPA} 2006 International Workshops, FHPCN, XHPC, S-GRACE, GridGIS, HPC-GTP, PDCE, ParDMCom, WOMP, ISDF, and UPWN, Sorrento, Italy, December 4-7, 2006, Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {4331},
  pages     = {155--164},
  publisher = {Springer},
  year      = {2006},
  url       = {https://doi.org/10.1007/11942634\_17},
  doi       = {10.1007/11942634\_17},
  timestamp = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/ispa/HoeflerSRL06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/parelec/MehlanSHMR06,
  author    = {Torsten Mehlan and Jochen Strunk and Torsten Hoefler and Frank Mietke and Wolfgang Rehm},
  title     = {{IRS} - {A} Portable Interface for Reconfigurable Systems},
  booktitle = {Fifth International Conference on Parallel Computing in Electrical Engineering {(PARELEC} 2006), 13-17 September 2006, Bialystok, Poland},
  pages     = {187--191},
  publisher = {{IEEE} Computer Society},
  year      = {2006},
  url       = {https://doi.org/10.1109/PARELEC.2006.50},
  doi       = {10.1109/PARELEC.2006.50},
  timestamp = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/parelec/MehlanSHMR06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% {InfiniBand} is brace-protected so sentence-casing styles keep its capitalisation.
@inproceedings{DBLP:conf/parelec/HoeflerVMMR06,
  author    = {Torsten Hoefler and Carsten Viertel and Torsten Mehlan and Frank Mietke and Wolfgang Rehm},
  title     = {Assessing Single-Message and Multi-Node Communication Performance of {InfiniBand}},
  booktitle = {Fifth International Conference on Parallel Computing in Electrical Engineering {(PARELEC} 2006), 13-17 September 2006, Bialystok, Poland},
  pages     = {227--232},
  publisher = {{IEEE} Computer Society},
  year      = {2006},
  url       = {https://doi.org/10.1109/PARELEC.2006.16},
  doi       = {10.1109/PARELEC.2006.16},
  timestamp = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/parelec/HoeflerVMMR06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/pvm/HoeflerGRL06,
  author    = {Torsten Hoefler and Peter Gottschling and Wolfgang Rehm and Andrew Lumsdaine},
  editor    = {Bernd Mohr and Jesper Larsson Tr{\"{a}}ff and Joachim Worringen and Jack J. Dongarra},
  title     = {Optimizing a Conjugate Gradient Solver with Non-Blocking Collective Operations},
  booktitle = {Recent Advances in Parallel Virtual Machine and Message Passing Interface, 13th European {PVM/MPI} User's Group Meeting, Bonn, Germany, September 17-20, 2006, Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {4192},
  pages     = {374--382},
  publisher = {Springer},
  year      = {2006},
  url       = {https://doi.org/10.1007/11846802\_52},
  doi       = {10.1007/11846802\_52},
  timestamp = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/pvm/HoeflerGRL06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% {LogP} and {Open MPI} are proper names; they are brace-protected so sentence-casing
% styles keep their capitalisation.
@inproceedings{DBLP:conf/icppw/HoeflerCMMR05,
  author    = {Torsten Hoefler and Lavinio Cerquetti and Torsten Mehlan and Frank Mietke and Wolfgang Rehm},
  title     = {A Practical Approach to the Rating of Barrier Algorithms Using the {LogP} Model and {Open MPI}},
  booktitle = {34th International Conference on Parallel Processing Workshops {(ICPP} 2005 Workshops), 14-17 June 2005, Oslo, Norway},
  pages     = {562--569},
  publisher = {{IEEE} Computer Society},
  year      = {2005},
  url       = {https://doi.org/10.1109/ICPPW.2005.14},
  doi       = {10.1109/ICPPW.2005.14},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icppw/HoeflerCMMR05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
manage site settings
To protect your privacy, all features that rely on external API calls from your browser are turned off by default. You need to opt-in for them to become active. All settings here will be stored as cookies with your web browser. For more information see our F.A.Q.