@comment{
  Source: dblp publication search, results exported as a .bib file.
  Search query: "Training Sparse Neural Networks."
}

% Conference paper, WSDM 2024, pages 712--720.
@inproceedings{DBLP:conf/wsdm/WangZW24,
  author = {Fali Wang and Tianxiang Zhao and Suhang Wang},
  editor = {Luz Angelica Caudillo{-}Mata and Silvio Lattanzi and Andr{\'{e}}s Mu{\~{n}}oz Medina and Leman Akoglu and Aristides Gionis and Sergei Vassilvitskii},
  title = {Distribution Consistency based Self-Training for Graph Neural Networks with Sparse Labels},
  booktitle = {Proceedings of the 17th {ACM} International Conference on Web Search and Data Mining, {WSDM} 2024, Merida, Mexico, March 4-8, 2024},
  pages = {712--720},
  publisher = {{ACM}},
  year = {2024},
  url = {https://doi.org/10.1145/3616855.3635793},
  doi = {10.1145/3616855.3635793},
  timestamp = {Mon, 01 Apr 2024 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/wsdm/WangZW24.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2401.10394, listed under CoRR.
@article{DBLP:journals/corr/abs-2401-10394,
  author = {Fali Wang and Tianxiang Zhao and Suhang Wang},
  title = {Distribution Consistency based Self-Training for Graph Neural Networks with Sparse Labels},
  journal = {CoRR},
  volume = {abs/2401.10394},
  year = {2024},
  url = {https://doi.org/10.48550/arXiv.2401.10394},
  doi = {10.48550/ARXIV.2401.10394},
  eprinttype = {arXiv},
  eprint = {2401.10394},
  timestamp = {Fri, 02 Feb 2024 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-2401-10394.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2402.11025, listed under CoRR.
% {Bayesian} is braced so that sentence-casing styles keep the proper adjective capitalised.
@article{DBLP:journals/corr/abs-2402-11025,
  author       = {Junbo Li and
                  Zichen Miao and
                  Qiang Qiu and
                  Ruqi Zhang},
  title        = {Training {Bayesian} Neural Networks with Sparse Subspace Variational
                  Inference},
  journal      = {CoRR},
  volume       = {abs/2402.11025},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2402.11025},
  doi          = {10.48550/ARXIV.2402.11025},
  eprinttype   = {arXiv},
  eprint       = {2402.11025},
  timestamp    = {Mon, 26 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2402-11025.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, volume 3, issue 2.
% pages holds the publisher's six-digit article number; the leading zero is part of it.
% The journal name is stored in full so the bibliography style decides on abbreviation.
@article{DBLP:journals/neuromorphic/PetschenigL23,
  author       = {Horst Petschenig and
                  Robert Legenstein},
  title        = {Quantized rewiring: hardware-aware training of sparse deep neural
                  networks},
  journal      = {Neuromorphic Computing and Engineering},
  volume       = {3},
  number       = {2},
  pages        = {024006},
  year         = {2023},
  url          = {https://doi.org/10.1088/2634-4386/accd8f},
  doi          = {10.1088/2634-4386/ACCD8F},
  timestamp    = {Sat, 13 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/neuromorphic/PetschenigL23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, DATE 2023, pages 1--2.
@inproceedings{DBLP:conf/date/FangSZW23,
  author = {Chao Fang and Wei Sun and Aojun Zhou and Zhongfeng Wang},
  title = {{CEST:} Computation-Efficient {N:M} Sparse Training for Deep Neural Networks},
  booktitle = {Design, Automation {\&} Test in Europe Conference {\&} Exhibition, {DATE} 2023, Antwerp, Belgium, April 17-19, 2023},
  pages = {1--2},
  publisher = {{IEEE}},
  year = {2023},
  url = {https://doi.org/10.23919/DATE56975.2023.10137121},
  doi = {10.23919/DATE56975.2023.10137121},
  timestamp = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/date/FangSZW23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, ICASSP 2023, pages 1--5.
% A comma was added before the {ICASSP} acronym so the booktitle follows the same
% "conference name, ACRONYM year, place, dates" pattern as the other entries.
@inproceedings{DBLP:conf/icassp/AliNN23,
  author       = {Murtiza Ali and
                  Aditya Arie Nugraha and
                  Karan Nathwani},
  title        = {Exploiting Sparse Recovery Algorithms for Semi-Supervised Training
                  of Deep Neural Networks for Direction-of-Arrival Estimation},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2023, Rhodes Island, Greece, June 4-10, 2023},
  pages        = {1--5},
  publisher    = {{IEEE}},
  year         = {2023},
  url          = {https://doi.org/10.1109/ICASSP49357.2023.10095717},
  doi          = {10.1109/ICASSP49357.2023.10095717},
  timestamp    = {Sun, 05 Nov 2023 16:51:21 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/AliNN23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, ICML 2023 (PMLR volume 202), pages 21951--21968.
@inproceedings{DBLP:conf/icml/LiuCZZ0H23,
  author = {Zirui Liu and Shengyuan Chen and Kaixiong Zhou and Daochen Zha and Xiao Huang and Xia Hu},
  editor = {Andreas Krause and Emma Brunskill and Kyunghyun Cho and Barbara Engelhardt and Sivan Sabato and Jonathan Scarlett},
  title = {{RSC:} Accelerate Graph Neural Networks Training via Randomized Sparse Computations},
  booktitle = {International Conference on Machine Learning, {ICML} 2023, 23-29 July 2023, Honolulu, Hawaii, {USA}},
  series = {Proceedings of Machine Learning Research},
  volume = {202},
  pages = {21951--21968},
  publisher = {{PMLR}},
  year = {2023},
  url = {https://proceedings.mlr.press/v202/liu23ad.html},
  timestamp = {Tue, 30 Apr 2024 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/icml/LiuCZZ0H23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, ICML 2023 (PMLR volume 202), pages 26215--26227.
% {SparseProp} is braced so sentence-casing styles do not turn it into "Sparseprop".
@inproceedings{DBLP:conf/icml/NikdanPIKA23,
  author       = {Mahdi Nikdan and
                  Tommaso Pegolotti and
                  Eugenia Iofinova and
                  Eldar Kurtic and
                  Dan Alistarh},
  editor       = {Andreas Krause and
                  Emma Brunskill and
                  Kyunghyun Cho and
                  Barbara Engelhardt and
                  Sivan Sabato and
                  Jonathan Scarlett},
  title        = {{SparseProp}: Efficient Sparse Backpropagation for Faster Training of
                  Neural Networks at the Edge},
  booktitle    = {International Conference on Machine Learning, {ICML} 2023, 23-29 July
                  2023, Honolulu, Hawaii, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {202},
  pages        = {26215--26227},
  publisher    = {{PMLR}},
  year         = {2023},
  url          = {https://proceedings.mlr.press/v202/nikdan23a.html},
  timestamp    = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/NikdanPIKA23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, IPDPS 2023, pages 501--511.
@inproceedings{DBLP:conf/ipps/FanWC23,
  author = {Ruibo Fan and Wei Wang and Xiaowen Chu},
  title = {Fast Sparse {GPU} Kernels for Accelerated Training of Graph Neural Networks},
  booktitle = {{IEEE} International Parallel and Distributed Processing Symposium, {IPDPS} 2023, St. Petersburg, FL, USA, May 15-19, 2023},
  pages = {501--511},
  publisher = {{IEEE}},
  year = {2023},
  url = {https://doi.org/10.1109/IPDPS54959.2023.00057},
  doi = {10.1109/IPDPS54959.2023.00057},
  timestamp = {Sun, 06 Aug 2023 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/ipps/FanWC23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, KSEM 2023 (LNCS volume 14117), pages 114--123.
% The underscore in url/doi is stored unescaped: these fields are handled verbatim
% by URL-aware styles, so a backslash would become part of the link target.
@inproceedings{DBLP:conf/ksem/YaoWGSLWWC23,
  author       = {Tiechui Yao and
                  Jue Wang and
                  Junyu Gu and
                  Yumeng Shi and
                  Fang Liu and
                  Xiaoguang Wang and
                  Yangang Wang and
                  Xuebin Chi},
  editor       = {Zhi Jin and
                  Yuncheng Jiang and
                  Robert Andrei Buchmann and
                  Yaxin Bi and
                  Ana{-}Maria Ghiran and
                  Wenjun Ma},
  title        = {A Sparse Matrix Optimization Method for Graph Neural Networks Training},
  booktitle    = {Knowledge Science, Engineering and Management - 16th International
                  Conference, {KSEM} 2023, Guangzhou, China, August 16-18, 2023, Proceedings,
                  Part {I}},
  series       = {Lecture Notes in Computer Science},
  volume       = {14117},
  pages        = {114--123},
  publisher    = {Springer},
  year         = {2023},
  url          = {https://doi.org/10.1007/978-3-031-40283-8_11},
  doi          = {10.1007/978-3-031-40283-8_11},
  timestamp    = {Fri, 18 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ksem/YaoWGSLWWC23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, NeurIPS 2023 (no page numbers recorded).
% {SparseProp} is braced so sentence-casing styles do not turn it into "Sparseprop".
% The underscore in url is stored unescaped because URL-aware styles print the field verbatim.
@inproceedings{DBLP:conf/nips/Engelken23,
  author       = {Rainer Engelken},
  editor       = {Alice Oh and
                  Tristan Naumann and
                  Amir Globerson and
                  Kate Saenko and
                  Moritz Hardt and
                  Sergey Levine},
  title        = {{SparseProp}: Efficient Event-Based Simulation and Training of Sparse
                  Recurrent Spiking Neural Networks},
  booktitle    = {Advances in Neural Information Processing Systems 36: Annual Conference
                  on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans,
                  LA, USA, December 10 - 16, 2023},
  year         = {2023},
  url          = {http://papers.nips.cc/paper_files/paper/2023/hash/0b443d358a391166d1fbf551fb53de02-Abstract-Conference.html},
  timestamp    = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/Engelken23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2302.04852, listed under CoRR.
% {SparseProp} is braced so sentence-casing styles do not turn it into "Sparseprop".
@article{DBLP:journals/corr/abs-2302-04852,
  author       = {Mahdi Nikdan and
                  Tommaso Pegolotti and
                  Eugenia Iofinova and
                  Eldar Kurtic and
                  Dan Alistarh},
  title        = {{SparseProp}: Efficient Sparse Backpropagation for Faster Training of
                  Neural Networks},
  journal      = {CoRR},
  volume       = {abs/2302.04852},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2302.04852},
  doi          = {10.48550/ARXIV.2302.04852},
  eprinttype   = {arXiv},
  eprint       = {2302.04852},
  timestamp    = {Mon, 13 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2302-04852.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2304.06941, listed under CoRR.
@article{DBLP:journals/corr/abs-2304-06941,
  author = {Abhisek Kundu and Naveen K. Mellempudi and Dharma Teja Vooturi and Bharat Kaul and Pradeep Dubey},
  title = {{AUTOSPARSE:} Towards Automated Sparse Training of Deep Neural Networks},
  journal = {CoRR},
  volume = {abs/2304.06941},
  year = {2023},
  url = {https://doi.org/10.48550/arXiv.2304.06941},
  doi = {10.48550/ARXIV.2304.06941},
  eprinttype = {arXiv},
  eprint = {2304.06941},
  timestamp = {Wed, 19 Apr 2023 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/abs-2304-06941.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2312.17216, listed under CoRR.
% {SparseProp} is braced so sentence-casing styles do not turn it into "Sparseprop".
@article{DBLP:journals/corr/abs-2312-17216,
  author       = {Rainer Engelken},
  title        = {{SparseProp}: Efficient Event-Based Simulation and Training of Sparse
                  Recurrent Spiking Neural Networks},
  journal      = {CoRR},
  volume       = {abs/2312.17216},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2312.17216},
  doi          = {10.48550/ARXIV.2312.17216},
  eprinttype   = {arXiv},
  eprint       = {2312.17216},
  timestamp    = {Wed, 10 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2312-17216.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, volume 111, issue 12, pages 4411--4452.
% The journal name is stored in full so the bibliography style decides on abbreviation.
@article{DBLP:journals/ml/AtashgahiPLMVP22,
  author       = {Zahra Atashgahi and
                  Joost Pieterse and
                  Shiwei Liu and
                  Decebal Constantin Mocanu and
                  Raymond N. J. Veldhuis and
                  Mykola Pechenizkiy},
  title        = {A brain-inspired algorithm for training highly sparse neural networks},
  journal      = {Machine Learning},
  volume       = {111},
  number       = {12},
  pages        = {4411--4452},
  year         = {2022},
  url          = {https://doi.org/10.1007/s10994-022-06266-w},
  doi          = {10.1007/S10994-022-06266-W},
  timestamp    = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ml/AtashgahiPLMVP22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, ICPP 2022, article 7 (pages 7:1--7:11).
% {EmbRace} is braced so sentence-casing styles do not turn it into "Embrace".
@inproceedings{DBLP:conf/icpp/LiLL0YD22,
  author       = {Shengwei Li and
                  Zhiquan Lai and
                  Dongsheng Li and
                  Yiming Zhang and
                  Xiangyu Ye and
                  Yabo Duan},
  title        = {{EmbRace}: Accelerating Sparse Communication for Distributed Training
                  of Deep Neural Networks},
  booktitle    = {Proceedings of the 51st International Conference on Parallel Processing,
                  {ICPP} 2022, Bordeaux, France, 29 August 2022 - 1 September 2022},
  pages        = {7:1--7:11},
  publisher    = {{ACM}},
  year         = {2022},
  url          = {https://doi.org/10.1145/3545008.3545011},
  doi          = {10.1145/3545008.3545011},
  timestamp    = {Tue, 31 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icpp/LiLL0YD22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2207.08629, listed under CoRR.
@article{DBLP:journals/corr/abs-2207-08629,
  author = {Chuang Liu and Xueqi Ma and Yibing Zhan and Liang Ding and Dapeng Tao and Bo Du and Wenbin Hu and Danilo P. Mandic},
  title = {Comprehensive Graph Gradual Pruning for Sparse Training in Graph Neural Networks},
  journal = {CoRR},
  volume = {abs/2207.08629},
  year = {2022},
  url = {https://doi.org/10.48550/arXiv.2207.08629},
  doi = {10.48550/ARXIV.2207.08629},
  eprinttype = {arXiv},
  eprint = {2207.08629},
  timestamp = {Thu, 13 Oct 2022 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/abs-2207-08629.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2210.10737, listed under CoRR.
@article{DBLP:journals/corr/abs-2210-10737,
  author = {Zirui Liu and Shengyuan Chen and Kaixiong Zhou and Daochen Zha and Xiao Huang and Xia Hu},
  title = {{RSC:} Accelerating Graph Neural Networks Training via Randomized Sparse Computations},
  journal = {CoRR},
  volume = {abs/2210.10737},
  year = {2022},
  url = {https://doi.org/10.48550/arXiv.2210.10737},
  doi = {10.48550/ARXIV.2210.10737},
  eprinttype = {arXiv},
  eprint = {2210.10737},
  timestamp = {Tue, 30 Apr 2024 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/abs-2210-10737.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, IEEE Access volume 9, pages 52067--52078.
@article{DBLP:journals/access/LabanAEST21,
  author = {Noureldin Laban and Bassam Abdellatif and Hala M. Ebeid and Howida A. Shedeed and Mohamed F. Tolba},
  title = {Sparse Pixel Training of Convolutional Neural Networks for Land Cover Classification},
  journal = {{IEEE} Access},
  volume = {9},
  pages = {52067--52078},
  year = {2021},
  url = {https://doi.org/10.1109/ACCESS.2021.3069882},
  doi = {10.1109/ACCESS.2021.3069882},
  timestamp = {Thu, 29 Apr 2021 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/access/LabanAEST21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, volume 33, issue 15, pages 9625--9636.
% The journal name is stored in full so the bibliography style decides on abbreviation.
@article{DBLP:journals/nca/LiuNMMP21,
  author       = {Shiwei Liu and
                  Iftitahu Ni'mah and
                  Vlado Menkovski and
                  Decebal Constantin Mocanu and
                  Mykola Pechenizkiy},
  title        = {Efficient and effective training of sparse recurrent neural networks},
  journal      = {Neural Computing and Applications},
  volume       = {33},
  number       = {15},
  pages        = {9625--9636},
  year         = {2021},
  url          = {https://doi.org/10.1007/s00521-021-05727-y},
  doi          = {10.1007/S00521-021-05727-Y},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/nca/LiuNMMP21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Workshop paper, CVPR Workshops 2021, pages 2621--2630.
% Underscores in url are stored unescaped because URL-aware styles print the field
% verbatim; an escaping backslash would end up inside the link target.
@inproceedings{DBLP:conf/cvpr/CaiafaWSZ21,
  author       = {Cesar F. Caiafa and
                  Ziyao Wang and
                  Jordi Sol{\'{e}}{-}Casals and
                  Qibin Zhao},
  title        = {Learning From Incomplete Features by Simultaneous Training of Neural
                  Networks and Sparse Coding},
  booktitle    = {{IEEE} Conference on Computer Vision and Pattern Recognition Workshops,
                  {CVPR} Workshops 2021, virtual, June 19-25, 2021},
  pages        = {2621--2630},
  publisher    = {Computer Vision Foundation / {IEEE}},
  year         = {2021},
  url          = {https://openaccess.thecvf.com/content/CVPR2021W/LLID/html/Caiafa_Learning_From_Incomplete_Features_by_Simultaneous_Training_of_Neural_Networks_CVPRW_2021_paper.html},
  doi          = {10.1109/CVPRW53098.2021.00296},
  timestamp    = {Mon, 18 Jul 2022 16:47:41 +0200},
  biburl       = {https://dblp.org/rec/conf/cvpr/CaiafaWSZ21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, HPCC/DSS/SmartCity/DependSys 2021, pages 1049--1058.
@inproceedings{DBLP:conf/hpcc/YangWTSZ21,
  author = {Jianchao Yang and Mei Wen and Minjin Tang and Junzhong Shen and Chunyuan Zhang},
  title = {{SAI:} Self-Adjusting Incremental Quantile Estimation for Sparse Training of Neural Networks on Hardware Accelerators},
  booktitle = {2021 {IEEE} 23rd Int Conf on High Performance Computing {\&} Communications; 7th Int Conf on Data Science {\&} Systems; 19th Int Conf on Smart City; 7th Int Conf on Dependability in Sensor, Cloud {\&} Big Data Systems {\&} Application (HPCC/DSS/SmartCity/DependSys), Haikou, Hainan, China, December 20-22, 2021},
  pages = {1049--1058},
  publisher = {{IEEE}},
  year = {2021},
  url = {https://doi.org/10.1109/HPCC-DSS-SmartCity-DependSys53884.2021.00165},
  doi = {10.1109/HPCC-DSS-SMARTCITY-DEPENDSYS53884.2021.00165},
  timestamp = {Thu, 09 Jun 2022 16:39:42 +0200},
  biburl = {https://dblp.org/rec/conf/hpcc/YangWTSZ21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, ICS '21, pages 254--265.
@inproceedings{DBLP:conf/ics/DemirciF21,
  author = {Gunduz Vehbi Demirci and Hakan Ferhatosmanoglu},
  editor = {Huiyang Zhou and Jose Moreira and Frank Mueller and Yoav Etsion},
  title = {Partitioning sparse deep neural networks for scalable training and inference},
  booktitle = {{ICS} '21: 2021 International Conference on Supercomputing, Virtual Event, USA, June 14-17, 2021},
  pages = {254--265},
  publisher = {{ACM}},
  year = {2021},
  url = {https://doi.org/10.1145/3447818.3460372},
  doi = {10.1145/3447818.3460372},
  timestamp = {Wed, 09 Jun 2021 15:33:33 +0200},
  biburl = {https://dblp.org/rec/conf/ics/DemirciF21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, ISSCC 2021, pages 148--150.
% {4.81TFLOPS/W} is braced so sentence-casing styles do not lowercase the unit.
@inproceedings{DBLP:conf/isscc/ParkLJ21,
  author       = {Jeongwoo Park and
                  Sunwoo Lee and
                  Dongsuk Jeon},
  title        = {A 40nm {4.81TFLOPS/W} 8b Floating-Point Training Processor for Non-Sparse
                  Neural Networks Using Shared Exponent Bias and 24-Way Fused Multiply-Add
                  Tree},
  booktitle    = {{IEEE} International Solid-State Circuits Conference, {ISSCC} 2021,
                  San Francisco, CA, USA, February 13-22, 2021},
  pages        = {148--150},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/ISSCC42613.2021.9366031},
  doi          = {10.1109/ISSCC42613.2021.9366031},
  timestamp    = {Wed, 10 Mar 2021 15:02:58 +0100},
  biburl       = {https://dblp.org/rec/conf/isscc/ParkLJ21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, NeurIPS 2021, pages 24193--24205.
@inproceedings{DBLP:conf/nips/SungNR21,
  author = {Yi{-}Lin Sung and Varun Nair and Colin Raffel},
  editor = {Marc'Aurelio Ranzato and Alina Beygelzimer and Yann N. Dauphin and Percy Liang and Jennifer Wortman Vaughan},
  title = {Training Neural Networks with Fixed Sparse Masks},
  booktitle = {Advances in Neural Information Processing Systems 34: Annual Conference on Neural Information Processing Systems 2021, NeurIPS 2021, December 6-14, 2021, virtual},
  pages = {24193--24205},
  year = {2021},
  url = {https://proceedings.neurips.cc/paper/2021/hash/cb2653f548f8709598e8b5156738cc51-Abstract.html},
  timestamp = {Tue, 03 May 2022 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/nips/SungNR21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2104.11805, listed under CoRR.
@article{DBLP:journals/corr/abs-2104-11805,
  author = {Gunduz Vehbi Demirci and Hakan Ferhatosmanoglu},
  title = {Partitioning sparse deep neural networks for scalable training and inference},
  journal = {CoRR},
  volume = {abs/2104.11805},
  year = {2021},
  url = {https://arxiv.org/abs/2104.11805},
  eprinttype = {arXiv},
  eprint = {2104.11805},
  timestamp = {Mon, 03 May 2021 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/abs-2104-11805.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2106.09021, listed under CoRR.
@article{DBLP:journals/corr/abs-2106-09021,
  author = {Lorenzo Chicchi and Lorenzo Giambagli and Lorenzo Buffoni and Timoteo Carletti and Marco Ciavarella and Duccio Fanelli},
  title = {On the training of sparse and dense deep neural networks: less parameters, same performance},
  journal = {CoRR},
  volume = {abs/2106.09021},
  year = {2021},
  url = {https://arxiv.org/abs/2106.09021},
  eprinttype = {arXiv},
  eprint = {2106.09021},
  timestamp = {Tue, 29 Jun 2021 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/abs-2106-09021.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2110.09132, listed under CoRR.
% {EmbRace} is braced so sentence-casing styles do not turn it into "Embrace".
@article{DBLP:journals/corr/abs-2110-09132,
  author       = {Shengwei Li and
                  Zhiquan Lai and
                  Dongsheng Li and
                  Xiangyu Ye and
                  Yabo Duan},
  title        = {{EmbRace}: Accelerating Sparse Communication for Distributed Training
                  of {NLP} Neural Networks},
  journal      = {CoRR},
  volume       = {abs/2110.09132},
  year         = {2021},
  url          = {https://arxiv.org/abs/2110.09132},
  eprinttype   = {arXiv},
  eprint       = {2110.09132},
  timestamp    = {Tue, 14 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2110-09132.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2111.09839, listed under CoRR.
@article{DBLP:journals/corr/abs-2111-09839,
  author = {Yi{-}Lin Sung and Varun Nair and Colin Raffel},
  title = {Training Neural Networks with Fixed Sparse Masks},
  journal = {CoRR},
  volume = {abs/2111.09839},
  year = {2021},
  url = {https://arxiv.org/abs/2111.09839},
  eprinttype = {arXiv},
  eprint = {2111.09839},
  timestamp = {Mon, 22 Nov 2021 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-2111-09839.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, DAC 2020, pages 1--6.
% {SparseTrain} is braced so sentence-casing styles do not turn it into "Sparsetrain".
@inproceedings{DBLP:conf/dac/DaiYYCLSCZ20,
  author       = {Pengcheng Dai and
                  Jianlei Yang and
                  Xucheng Ye and
                  Xingzhou Cheng and
                  Junyu Luo and
                  Linghao Song and
                  Yiran Chen and
                  Weisheng Zhao},
  title        = {{SparseTrain}: Exploiting Dataflow Sparsity for Efficient Convolutional
                  Neural Networks Training},
  booktitle    = {57th {ACM/IEEE} Design Automation Conference, {DAC} 2020, San Francisco,
                  CA, USA, July 20-24, 2020},
  pages        = {1--6},
  publisher    = {{IEEE}},
  year         = {2020},
  url          = {https://doi.org/10.1109/DAC18072.2020.9218710},
  doi          = {10.1109/DAC18072.2020.9218710},
  timestamp    = {Wed, 20 Dec 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/dac/DaiYYCLSCZ20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Poster abstract, INFOCOM Workshops 2020, pages 1346--1347.
@inproceedings{DBLP:conf/infocom/YangLCL20,
  author = {Yuetong Yang and Zhiquan Lai and Lei Cai and Dongsheng Li},
  title = {Poster Abstract: Model Average-based Distributed Training for Sparse Deep Neural Networks},
  booktitle = {39th {IEEE} Conference on Computer Communications, {INFOCOM} Workshops 2020, Toronto, ON, Canada, July 6-9, 2020},
  pages = {1346--1347},
  publisher = {{IEEE}},
  year = {2020},
  url = {https://doi.org/10.1109/INFOCOMWKSHPS50562.2020.9162748},
  doi = {10.1109/INFOCOMWKSHPS50562.2020.9162748},
  timestamp = {Tue, 14 Mar 2023 00:00:00 +0100},
  biburl = {https://dblp.org/rec/conf/infocom/YangLCL20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, ISLPED '20, pages 211--216.
% {SparTANN} is braced so sentence-casing styles do not turn it into "Spartann".
@inproceedings{DBLP:conf/islped/SimCL20,
  author       = {Hyeonuk Sim and
                  Jooyeon Choi and
                  Jongeun Lee},
  editor       = {David Atienza Alonso and
                  Qinru Qiu and
                  Sherief Reda and
                  Yiran Chen},
  title        = {{SparTANN}: sparse training accelerator for neural networks with threshold-based
                  sparsification},
  booktitle    = {{ISLPED} '20: {ACM/IEEE} International Symposium on Low Power Electronics
                  and Design, Boston, Massachusetts, August 10-12, 2020},
  pages        = {211--216},
  publisher    = {{ACM}},
  year         = {2020},
  url          = {https://doi.org/10.1145/3370748.3406554},
  doi          = {10.1145/3370748.3406554},
  timestamp    = {Tue, 05 Jul 2022 15:18:16 +0200},
  biburl       = {https://dblp.org/rec/conf/islped/SimCL20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2003.11316, listed under CoRR.
@article{DBLP:journals/corr/abs-2003-11316,
  author = {Namhoon Lee and Philip H. S. Torr and Martin Jaggi},
  title = {Data Parallelism in Training Sparse Neural Networks},
  journal = {CoRR},
  volume = {abs/2003.11316},
  year = {2020},
  url = {https://arxiv.org/abs/2003.11316},
  eprinttype = {arXiv},
  eprint = {2003.11316},
  timestamp = {Wed, 01 Apr 2020 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/abs-2003-11316.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2007.13595, listed under CoRR.
% {SparseTrain} is braced so sentence-casing styles do not turn it into "Sparsetrain".
@article{DBLP:journals/corr/abs-2007-13595,
  author       = {Pengcheng Dai and
                  Jianlei Yang and
                  Xucheng Ye and
                  Xingzhou Cheng and
                  Junyu Luo and
                  Linghao Song and
                  Yiran Chen and
                  Weisheng Zhao},
  title        = {{SparseTrain}: Exploiting Dataflow Sparsity for Efficient Convolutional
                  Neural Networks Training},
  journal      = {CoRR},
  volume       = {abs/2007.13595},
  year         = {2020},
  url          = {https://arxiv.org/abs/2007.13595},
  eprinttype   = {arXiv},
  eprint       = {2007.13595},
  timestamp    = {Wed, 20 Dec 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2007-13595.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2008.09661, listed under CoRR.
@article{DBLP:journals/corr/abs-2008-09661,
  author = {Jonathan W. Siegel and Jianhong Chen and Jinchao Xu},
  title = {Training Sparse Neural Networks using Compressed Sensing},
  journal = {CoRR},
  volume = {abs/2008.09661},
  year = {2020},
  url = {https://arxiv.org/abs/2008.09661},
  eprinttype = {arXiv},
  eprint = {2008.09661},
  timestamp = {Fri, 28 Aug 2020 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/abs-2008-09661.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2008.10183, listed under CoRR.
@article{DBLP:journals/corr/abs-2008-10183,
  author = {Skyler Seto and Martin T. Wells and Wenyu Zhang},
  title = {Hierarchical Adaptive Lasso: Learning Sparse Neural Networks with Shrinkage via Single Stage Training},
  journal = {CoRR},
  volume = {abs/2008.10183},
  year = {2020},
  url = {https://arxiv.org/abs/2008.10183},
  eprinttype = {arXiv},
  eprint = {2008.10183},
  timestamp = {Wed, 01 Sep 2021 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/abs-2008-10183.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2011.14047, listed under CoRR.
@article{DBLP:journals/corr/abs-2011-14047,
  author = {Cesar F. Caiafa and Ziyao Wang and Jordi Sol{\'{e}}{-}Casals and Qibin Zhao},
  title = {Learning from Incomplete Data by Simultaneous Training of Neural Networks and Sparse Coding},
  journal = {CoRR},
  volume = {abs/2011.14047},
  year = {2020},
  url = {https://arxiv.org/abs/2011.14047},
  eprinttype = {arXiv},
  eprint = {2011.14047},
  timestamp = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/abs-2011-14047.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/hpec/Hasanzadeh-Mofrad19,
  author       = {Hasanzadeh{-}Mofrad, Mohammad and
                  Melhem, Rami G. and
                  Ahmad, Muhammad Yousuf and
                  Hammoud, Mohammad},
  title        = {Multithreaded Layer-wise Training of Sparse Deep Neural Networks using
                  Compressed Sparse Column},
  booktitle    = {2019 {IEEE} High Performance Extreme Computing Conference, {HPEC}
                  2019, Waltham, MA, USA, September 24-26, 2019},
  pages        = {1--6},
  publisher    = {{IEEE}},
  year         = {2019},
  url          = {https://doi.org/10.1109/HPEC.2019.8916494},
  doi          = {10.1109/HPEC.2019.8916494},
  timestamp    = {Thu, 12 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/hpec/Hasanzadeh-Mofrad19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The acronym in the title is brace-protected so sentence-casing styles keep "GPUs".
@inproceedings{DBLP:conf/hpec/WangHKXWZL19,
  author       = {Wang, Jianzong and
                  Huang, Zhangcheng and
                  Kong, Lingwei and
                  Xiao, Jing and
                  Wang, Pengyu and
                  Zhang, Lu and
                  Li, Chao},
  title        = {Performance of Training Sparse Deep Neural Networks on {GPUs}},
  booktitle    = {2019 {IEEE} High Performance Extreme Computing Conference, {HPEC}
                  2019, Waltham, MA, USA, September 24-26, 2019},
  pages        = {1--5},
  publisher    = {{IEEE}},
  year         = {2019},
  url          = {https://doi.org/10.1109/HPEC.2019.8916506},
  doi          = {10.1109/HPEC.2019.8916506},
  timestamp    = {Wed, 07 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/hpec/WangHKXWZL19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Published ICML 2019 version; the CoRR preprint with the same authors and
% title is DBLP:journals/corr/abs-1902-05967. The title is stored in Title Case
% (matching the preprint entry) so styles can downcase it if they wish.
@inproceedings{DBLP:conf/icml/MostafaW19,
  author       = {Mostafa, Hesham and
                  Wang, Xin},
  editor       = {Chaudhuri, Kamalika and
                  Salakhutdinov, Ruslan},
  title        = {Parameter Efficient Training of Deep Convolutional Neural Networks
                  by Dynamic Sparse Reparameterization},
  booktitle    = {Proceedings of the 36th International Conference on Machine Learning,
                  {ICML} 2019, 9-15 June 2019, Long Beach, California, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {97},
  pages        = {4646--4655},
  publisher    = {{PMLR}},
  year         = {2019},
  url          = {https://proceedings.mlr.press/v97/mostafa19a.html},
  timestamp    = {Tue, 11 Jun 2019 15:37:38 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/MostafaW19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint with the same authors and title as DBLP:conf/icml/MostafaW19;
% cite the ICML entry when the published version is meant.
@article{DBLP:journals/corr/abs-1902-05967,
  author       = {Mostafa, Hesham and
                  Wang, Xin},
  title        = {Parameter Efficient Training of Deep Convolutional Neural Networks
                  by Dynamic Sparse Reparameterization},
  journal      = {CoRR},
  volume       = {abs/1902.05967},
  year         = {2019},
  url          = {https://arxiv.org/abs/1902.05967},
  eprinttype   = {arXiv},
  eprint       = {1902.05967},
  timestamp    = {Tue, 21 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1902-05967.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1906-10732,
  author       = {Evci, Utku and
                  Pedregosa, Fabian and
                  Gomez, Aidan N. and
                  Elsen, Erich},
  title        = {The Difficulty of Training Sparse Neural Networks},
  journal      = {CoRR},
  volume       = {abs/1906.10732},
  year         = {2019},
  url          = {https://arxiv.org/abs/1906.10732},
  eprinttype   = {arXiv},
  eprint       = {1906.10732},
  timestamp    = {Thu, 27 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1906-10732.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1906-11786,
  author       = {Balog, Matej and
                  van Merri{\"{e}}nboer, Bart and
                  Moitra, Subhodeep and
                  Li, Yujia and
                  Tarlow, Daniel},
  title        = {Fast Training of Sparse Graph Neural Networks on Dense Hardware},
  journal      = {CoRR},
  volume       = {abs/1906.11786},
  year         = {2019},
  url          = {https://arxiv.org/abs/1906.11786},
  eprinttype   = {arXiv},
  eprint       = {1906.11786},
  timestamp    = {Mon, 01 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1906-11786.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/nn/Xia18,
  author       = {Xia, Xiao{-}Lei},
  title        = {Training sparse least squares support vector machines by the {QR}
                  decomposition},
  journal      = {Neural Networks},
  volume       = {106},
  pages        = {175--184},
  year         = {2018},
  url          = {https://doi.org/10.1016/j.neunet.2018.07.008},
  doi          = {10.1016/J.NEUNET.2018.07.008},
  timestamp    = {Sat, 30 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/nn/Xia18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1807-04222,
  author       = {Jia, Xiaodong and
                  Zhao, Liang and
                  Zhang, Lian and
                  He, Juncai and
                  Xu, Jinchao},
  title        = {Modified Regularized Dual Averaging Method for Training Sparse Convolutional
                  Neural Networks},
  journal      = {CoRR},
  volume       = {abs/1807.04222},
  year         = {2018},
  url          = {https://arxiv.org/abs/1807.04222},
  eprinttype   = {arXiv},
  eprint       = {1807.04222},
  timestamp    = {Wed, 15 May 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1807-04222.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Workshop-proceedings version; the CoRR preprint with the same authors and
% title is DBLP:journals/corr/SrinivasSB16.
@inproceedings{DBLP:conf/cvpr/SrinivasSB17,
  author       = {Srinivas, Suraj and
                  Subramanya, Akshayvarun and
                  Babu, R. Venkatesh},
  title        = {Training Sparse Neural Networks},
  booktitle    = {2017 {IEEE} Conference on Computer Vision and Pattern Recognition
                  Workshops, {CVPR} Workshops 2017, Honolulu, HI, USA, July 21-26, 2017},
  pages        = {455--462},
  publisher    = {{IEEE} Computer Society},
  year         = {2017},
  url          = {https://doi.org/10.1109/CVPRW.2017.61},
  doi          = {10.1109/CVPRW.2017.61},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/cvpr/SrinivasSB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The doi and url fields hold the raw identifier (no backslash before the
% underscore): these fields are consumed verbatim by url-aware styles, so an
% escaped underscore would end up inside the resolved link.
% The CoRR preprint with the same authors and title is
% DBLP:journals/corr/abs-1711-01343.
@inproceedings{DBLP:conf/icann/DeySCB17,
  author       = {Dey, Sourya and
                  Shao, Yinan and
                  Chugg, Keith M. and
                  Beerel, Peter A.},
  editor       = {Lintas, Alessandra and
                  Rovetta, Stefano and
                  Verschure, Paul F. M. J. and
                  Villa, Alessandro E. P.},
  title        = {Accelerating Training of Deep Neural Networks via Sparse Edge Processing},
  booktitle    = {Artificial Neural Networks and Machine Learning - {ICANN} 2017 - 26th
                  International Conference on Artificial Neural Networks, Alghero, Italy,
                  September 11-14, 2017, Proceedings, Part {I}},
  series       = {Lecture Notes in Computer Science},
  volume       = {10613},
  pages        = {273--280},
  publisher    = {Springer},
  year         = {2017},
  url          = {https://doi.org/10.1007/978-3-319-68600-4_32},
  doi          = {10.1007/978-3-319-68600-4_32},
  timestamp    = {Sun, 25 Jul 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icann/DeySCB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The url field holds the raw address (no backslash before the underscore in
% the OpenReview id), because url fields are consumed verbatim by url-aware styles.
@inproceedings{DBLP:conf/iclr/HanPNMGTEVPTCD17,
  author       = {Han, Song and
                  Pool, Jeff and
                  Narang, Sharan and
                  Mao, Huizi and
                  Gong, Enhao and
                  Tang, Shijian and
                  Elsen, Erich and
                  Vajda, Peter and
                  Paluri, Manohar and
                  Tran, John and
                  Catanzaro, Bryan and
                  Dally, William J.},
  title        = {{DSD:} Dense-Sparse-Dense Training for Deep Neural Networks},
  booktitle    = {5th International Conference on Learning Representations, {ICLR} 2017,
                  Toulon, France, April 24-26, 2017, Conference Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2017},
  url          = {https://openreview.net/forum?id=HyoST_9xl},
  timestamp    = {Fri, 20 Nov 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/iclr/HanPNMGTEVPTCD17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/MocanuMSNGL17,
  author       = {Mocanu, Decebal Constantin and
                  Mocanu, Elena and
                  Stone, Peter and
                  Nguyen, Phuong H. and
                  Gibescu, Madeleine and
                  Liotta, Antonio},
  title        = {Evolutionary Training of Sparse Artificial Neural Networks: {A} Network
                  Science Perspective},
  journal      = {CoRR},
  volume       = {abs/1707.04780},
  year         = {2017},
  url          = {https://arxiv.org/abs/1707.04780},
  eprinttype   = {arXiv},
  eprint       = {1707.04780},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/MocanuMSNGL17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint with the same authors and title as DBLP:conf/icann/DeySCB17;
% cite the ICANN entry when the published version is meant.
@article{DBLP:journals/corr/abs-1711-01343,
  author       = {Dey, Sourya and
                  Shao, Yinan and
                  Chugg, Keith M. and
                  Beerel, Peter A.},
  title        = {Accelerating Training of Deep Neural Networks via Sparse Edge Processing},
  journal      = {CoRR},
  volume       = {abs/1711.01343},
  year         = {2017},
  url          = {https://arxiv.org/abs/1711.01343},
  eprinttype   = {arXiv},
  eprint       = {1711.01343},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1711-01343.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NOTE(review): possibly the preprint of DBLP:conf/iclr/HanPNMGTEVPTCD17 (both
% are "DSD" papers with overlapping authors, but title and author list differ);
% confirm before treating the two as duplicates.
@article{DBLP:journals/corr/HanPNMTECTD16,
  author       = {Han, Song and
                  Pool, Jeff and
                  Narang, Sharan and
                  Mao, Huizi and
                  Tang, Shijian and
                  Elsen, Erich and
                  Catanzaro, Bryan and
                  Tran, John and
                  Dally, William J.},
  title        = {{DSD:} Regularizing Deep Neural Networks with Dense-Sparse-Dense Training
                  Flow},
  journal      = {CoRR},
  volume       = {abs/1607.04381},
  year         = {2016},
  url          = {https://arxiv.org/abs/1607.04381},
  eprinttype   = {arXiv},
  eprint       = {1607.04381},
  timestamp    = {Fri, 20 Nov 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/HanPNMTECTD16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint with the same authors and title as DBLP:conf/cvpr/SrinivasSB17;
% cite the CVPR Workshops entry when the published version is meant.
@article{DBLP:journals/corr/SrinivasSB16,
  author       = {Srinivas, Suraj and
                  Subramanya, Akshayvarun and
                  Babu, R. Venkatesh},
  title        = {Training Sparse Neural Networks},
  journal      = {CoRR},
  volume       = {abs/1611.06694},
  year         = {2016},
  url          = {https://arxiv.org/abs/1611.06694},
  eprinttype   = {arXiv},
  eprint       = {1611.06694},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/SrinivasSB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2015 workshop-track paper whose only link is its arXiv record; the
% eprint fields mirror the identifier in the url so eprint-aware styles can
% use it, as in the other arXiv-hosted entries of this file.
@inproceedings{DBLP:journals/corr/SedghiA14,
  author       = {Sedghi, Hanie and
                  Anandkumar, Anima},
  editor       = {Bengio, Yoshua and
                  LeCun, Yann},
  title        = {Provable Methods for Training Neural Networks with Sparse Connectivity},
  booktitle    = {3rd International Conference on Learning Representations, {ICLR} 2015,
                  San Diego, CA, USA, May 7-9, 2015, Workshop Track Proceedings},
  year         = {2015},
  url          = {https://arxiv.org/abs/1412.2693},
  eprinttype   = {arXiv},
  eprint       = {1412.2693},
  timestamp    = {Wed, 17 Jul 2019 10:40:54 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/SedghiA14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ijon/Giustolisi04,
  author       = {Giustolisi, Orazio},
  title        = {Sparse solution in training artificial neural networks},
  journal      = {Neurocomputing},
  volume       = {56},
  pages        = {285--304},
  year         = {2004},
  url          = {https://doi.org/10.1016/j.neucom.2003.09.005},
  doi          = {10.1016/J.NEUCOM.2003.09.005},
  timestamp    = {Tue, 06 Jun 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ijon/Giustolisi04.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The booktitle acronym is spelled FSKD (Fuzzy Systems and Knowledge Discovery,
% matching the citation key) and brace-protected against recasing.
@inproceedings{DBLP:conf/fskd/LerTC02,
  author       = {Ler, Y. H. and
                  Turega, Mike and
                  Cottis, R. A.},
  editor       = {Wang, Lipo and
                  Halgamuge, Saman K. and
                  Yao, Xin},
  title        = {Training Neural Networks to Produce Smooth Interpolations Between
                  Sparsely Distributed Data Points},
  booktitle    = {{FSKD}'02, Proceedings of the 1st International Conference on Fuzzy
                  Systems and Knowledge Discovery: Computational Intelligence for the
                  E-Age, 2 Volumes, November 18-22, 2002, Orchid Country Club, Singapore},
  pages        = {677--681},
  year         = {2002},
  timestamp    = {Mon, 22 May 2017 14:08:56 +0200},
  biburl       = {https://dblp.org/rec/conf/fskd/LerTC02.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% A service of Schloss Dagstuhl - Leibniz Center for Informatics