From f974f7ba7b7fe0c78fe4298956cde7d02fbc1605 Mon Sep 17 00:00:00 2001 From: Vijay Janapa Reddi Date: Tue, 7 May 2024 11:28:13 -0400 Subject: [PATCH] BetterBib fix betterbib update -i -b contents/robust_ai/robust_ai.bib --- contents/robust_ai/robust_ai.bib | 1411 +++++++++++++++++------------- 1 file changed, 811 insertions(+), 600 deletions(-) diff --git a/contents/robust_ai/robust_ai.bib b/contents/robust_ai/robust_ai.bib index 94b429b8..3283e3b5 100644 --- a/contents/robust_ai/robust_ai.bib +++ b/contents/robust_ai/robust_ai.bib @@ -1,753 +1,964 @@ -@article{ahmadilivani2024systematic, -title={A systematic literature review on hardware reliability assessment methods for deep neural networks}, -author={Ahmadilivani, Mohammad Hasan and Taheri, Mahdi and Raik, Jaan and Daneshtalab, Masoud and Jenihhin, Maksim}, -journal={ACM Computing Surveys}, -volume={56}, -number={6}, -pages={1--39}, -year={2024}, -publisher={ACM New York, NY} +%comment{This file was created with betterbib v5.0.11.} + + +@inproceedings{addepalli2020towards, + author = {Addepalli, Sravanti and Vivek, B. S. 
and Baburaj, Arya and Sriramanan, Gaurang and Venkatesh Babu, R.}, + title = {Towards Achieving Adversarial Robustness by Enforcing Feature Consistency Across Bit Planes}, + year = {2020}, + booktitle = {2020 IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, + pages = {1020--1029}, + doi = {10.1109/cvpr42600.2020.00110}, + source = {Crossref}, + url = {https://doi.org/10.1109/cvpr42600.2020.00110}, + publisher = {IEEE}, + month = jun, } -@article{zhang2008distribution, -title={On the distribution of software faults}, -author={Zhang, Hongyu}, -journal={IEEE Transactions on Software Engineering}, -volume={34}, -number={2}, -pages={301--302}, -year={2008}, -publisher={IEEE} +@article{ahmadilivani2024systematic, + author = {Ahmadilivani, Mohammad Hasan and Taheri, Mahdi and Raik, Jaan and Daneshtalab, Masoud and Jenihhin, Maksim}, + title = {A Systematic Literature Review on Hardware Reliability Assessment Methods for Deep Neural Networks}, + year = {2024}, + journal = {ACM Comput. 
Surv.}, + publisher = {Association for Computing Machinery (ACM)}, + volume = {56}, + number = {6}, + pages = {1--39}, + doi = {10.1145/3638242}, + source = {Crossref}, + url = {https://doi.org/10.1145/3638242}, + issn = {0360-0300, 1557-7341}, + month = jan, } -@article{dixit2021silent, -title={Silent data corruptions at scale}, -author={Dixit, Harish Dattatraya and Pendharkar, Sneha and Beadon, Matt and Mason, Chris and Chakravarthy, Tejasvi and Muthiah, Bharath and Sankar, Sriram}, -journal={arXiv preprint arXiv:2102.11245}, -year={2021} +@article{arifeen2020approximate, + author = {Arifeen, Tooba and Hassan, Abdus Sami and Lee, Jeong-A}, + title = {Approximate Triple Modular Redundancy: {A} Survey}, + year = {2020}, + journal = {IEEE Access}, + publisher = {Institute of Electrical and Electronics Engineers (IEEE)}, + volume = {8}, + pages = {139851--139867}, + doi = {10.1109/access.2020.3012673}, + source = {Crossref}, + url = {https://doi.org/10.1109/access.2020.3012673}, + issn = {2169-3536}, } -@inproceedings{jha2019ml, -title={Ml-based fault injection for autonomous vehicles: A case for bayesian fault injection}, -author={Jha, Saurabh and Banerjee, Subho and Tsai, Timothy and Hari, Siva KS and Sullivan, Michael B and Kalbarczyk, Zbigniew T and Keckler, Stephen W and Iyer, Ravishankar K}, -booktitle={2019 49th annual IEEE/IFIP international conference on dependable systems and networks (DSN)}, -pages={112--124}, -year={2019}, -organization={IEEE} +@article{bai2021recent, + author = {Bai, Tao and Luo, Jinqi and Zhao, Jun and Wen, Bihan and Wang, Qian}, + title = {Recent advances in adversarial training for adversarial robustness}, + year = {2021}, + journal = {arXiv preprint arXiv:2102.01356}, } -@inproceedings{li2017understanding, -title={Understanding error propagation in deep learning neural network (DNN) accelerators and applications}, -author={Li, Guanpeng and Hari, Siva Kumar Sastry and Sullivan, Michael and Tsai, Timothy and Pattabiraman, Karthik 
and Emer, Joel and Keckler, Stephen W}, -booktitle={Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis}, -pages={1--12}, -year={2017} +@inproceedings{bannon2019computer, + author = {Bannon, Pete and Venkataramanan, Ganesh and Sarma, Debjit Das and Talpes, Emil}, + title = {Computer and Redundancy Solution for the Full Self-Driving Computer}, + year = {2019}, + booktitle = {2019 IEEE Hot Chips 31 Symposium (HCS)}, + pages = {1--22}, + organization = {IEEE Computer Society}, + doi = {10.1109/hotchips.2019.8875645}, + source = {Crossref}, + url = {https://doi.org/10.1109/hotchips.2019.8875645}, + publisher = {IEEE}, + month = aug, } -@inproceedings{mukherjee2005soft, -title={The soft error problem: An architectural perspective}, -author={Mukherjee, Shubhendu S and Emer, Joel and Reinhardt, Steven K}, -booktitle={11th International Symposium on High-Performance Computer Architecture}, -pages={243--247}, -year={2005}, -organization={IEEE} +@article{beaton1974fitting, + author = {Beaton, Albert E. 
and Tukey, John W.}, + title = {The Fitting of Power Series, Meaning Polynomials, Illustrated on Band-Spectroscopic Data}, + year = {1974}, + journal = {Technometrics}, + publisher = {JSTOR}, + volume = {16}, + number = {2}, + pages = {147}, + doi = {10.2307/1267936}, + source = {Crossref}, + url = {https://doi.org/10.2307/1267936}, + issn = {0040-1706}, + month = may, } -@inproceedings{hong2019terminal, -title={Terminal brain damage: Exposing the graceless degradation in deep neural networks under hardware fault attacks}, -author={Hong, Sanghyun and Frigo, Pietro and Kaya, Yi{\u{g}}itcan and Giuffrida, Cristiano and DumitraČ™, Tudor}, -booktitle={28th USENIX Security Symposium (USENIX Security 19)}, -pages={497--514}, -year={2019} +@article{berger2014kolmogorov, + author = {Berger, Vance W and Zhou, YanYan}, + title = {Kolmogorov{\textendash}smirnov test: {Overview}}, + year = {2014}, + journal = {Wiley statsref: Statistics reference online}, + publisher = {Wiley Online Library}, } -@inproceedings{he2023understanding, -title={Understanding and mitigating hardware failures in deep learning training systems}, -author={He, Yi and Hutton, Mike and Chan, Steven and De Gruijl, Robert and Govindaraju, Rama and Patil, Nishant and Li, Yanjing}, -booktitle={Proceedings of the 50th Annual International Symposium on Computer Architecture}, -pages={1--16}, -year={2023} +@article{binkert2011gem5, + author = {Binkert, Nathan and Beckmann, Bradford and Black, Gabriel and Reinhardt, Steven K. and Saidi, Ali and Basu, Arkaprava and Hestness, Joel and Hower, Derek R. and Krishna, Tushar and Sardashti, Somayeh and Sen, Rathijit and Sewell, Korey and Shoaib, Muhammad and Vaish, Nilay and Hill, Mark D. 
and Wood, David A.}, + title = {The gem5 simulator}, + year = {2011}, + journal = {ACM SIGARCH Computer Architecture News}, + publisher = {Association for Computing Machinery (ACM)}, + volume = {39}, + number = {2}, + pages = {1--7}, + doi = {10.1145/2024716.2024718}, + source = {Crossref}, + url = {https://doi.org/10.1145/2024716.2024718}, + issn = {0163-5964}, + month = may, } -@inproceedings{wan2021analyzing, -title={Analyzing and improving fault tolerance of learning-based navigation systems}, -author={Wan, Zishen and Anwar, Aqeel and Hsiao, Yu-Shun and Jia, Tianyu and Reddi, Vijay Janapa and Raychowdhury, Arijit}, -booktitle={2021 58th ACM/IEEE Design Automation Conference (DAC)}, -pages={841--846}, -year={2021}, -organization={IEEE} +@article{bolchini2022fast, + author = {Bolchini, Cristiana and Cassano, Luca and Miele, Antonio and Toschi, Alessandro}, + title = {Fast and Accurate Error Simulation for {CNNs} Against Soft Errors}, + year = {2023}, + journal = {IEEE Trans. Comput.}, + publisher = {Institute of Electrical and Electronics Engineers (IEEE)}, + volume = {72}, + number = {4}, + pages = {984--997}, + doi = {10.1109/tc.2022.3184274}, + source = {Crossref}, + url = {https://doi.org/10.1109/tc.2022.3184274}, + issn = {0018-9340, 1557-9956, 2326-3814}, + month = apr, } -@inproceedings{mahmoud2020pytorchfi, -title={Pytorchfi: A runtime perturbation tool for dnns}, -author={Mahmoud, Abdulrahman and Aggarwal, Neeraj and Nobbe, Alex and Vicarte, Jose Rodrigo Sanchez and Adve, Sarita V and Fletcher, Christopher W and Frosio, Iuri and Hari, Siva Kumar Sastry}, -booktitle={2020 50th Annual IEEE/IFIP International Conference on Dependable Systems and Networks Workshops (DSN-W)}, -pages={25--31}, -year={2020}, -organization={IEEE} +@article{bushnell2002built, + author = {Bushnell, Michael L and Agrawal, Vishwani D}, + title = {Built-in self-test}, + year = {2002}, + journal = {Essentials of electronic testing for digital, memory and mixed-signal VLSI circuits}, + 
publisher = {Springer}, + pages = {489--548}, } -@article{hsiao2023silent, -title={Silent Data Corruption in Robot Operating System: A Case for End-to-End System-Level Fault Analysis Using Autonomous UAVs}, -author={Hsiao, Yu-Shun and Wan, Zishen and Jia, Tianyu and Ghosal, Radhika and Mahmoud, Abdulrahman and Raychowdhury, Arijit and Brooks, David and Wei, Gu-Yeon and Reddi, Vijay Janapa}, -journal={IEEE Transactions on Computer-Aided Design of Integrated Circuits and Systems}, -year={2023}, -publisher={IEEE} +@inproceedings{carlini2017towards, + author = {Carlini, Nicholas and Wagner, David}, + title = {Towards Evaluating the Robustness of Neural Networks}, + year = {2017}, + booktitle = {2017 IEEE Symposium on Security and Privacy (SP)}, + pages = {39--57}, + organization = {IEEE}, + doi = {10.1109/sp.2017.49}, + source = {Crossref}, + url = {https://doi.org/10.1109/sp.2017.49}, + publisher = {IEEE}, + month = may, } -@inproceedings{jha2019ml, -title={Ml-based fault injection for autonomous vehicles: A case for bayesian fault injection}, -author={Jha, Saurabh and Banerjee, Subho and Tsai, Timothy and Hari, Siva KS and Sullivan, Michael B and Kalbarczyk, Zbigniew T and Keckler, Stephen W and Iyer, Ravishankar K}, -booktitle={2019 49th annual IEEE/IFIP international conference on dependable systems and networks (DSN)}, -pages={112--124}, -year={2019}, -organization={IEEE} +@article{carta2020local, + author = {Carta, Salvatore and Podda, Alessandro Sebastian and Recupero, Diego Reforgiato and Saia, Roberto}, + title = {A Local Feature Engineering Strategy to Improve Network Anomaly Detection}, + year = {2020}, + journal = {Future Internet}, + publisher = {MDPI AG}, + volume = {12}, + number = {10}, + pages = {177}, + doi = {10.3390/fi12100177}, + source = {Crossref}, + url = {https://doi.org/10.3390/fi12100177}, + issn = {1999-5903}, + month = oct, } -@inproceedings{seong2010safer, -title={SAFER: Stuck-at-fault error recovery for memories}, -author={Seong, Nak Hee 
and Woo, Dong Hyuk and Srinivasan, Vijayalakshmi and Rivers, Jude A and Lee, Hsien-Hsin S}, -booktitle={2010 43rd Annual IEEE/ACM International Symposium on Microarchitecture (MICRO)}, -pages={115--124}, -year={2010}, -organization={IEEE} +@article{chandola2009anomaly, + author = {Chandola, Varun and Banerjee, Arindam and Kumar, Vipin}, + title = {Anomaly detection}, + year = {2009}, + journal = {ACM Comput. Surv.}, + publisher = {Association for Computing Machinery (ACM)}, + volume = {41}, + number = {3}, + pages = {1--58}, + doi = {10.1145/1541880.1541882}, + source = {Crossref}, + url = {https://doi.org/10.1145/1541880.1541882}, + subtitle = {A survey}, + issn = {0360-0300, 1557-7341}, + month = jul, } -@inproceedings{he2023understanding, -title={Understanding Permanent Hardware Failures in Deep Learning Training Accelerator Systems}, -author={He, Yi and Li, Yanjing}, -booktitle={2023 IEEE European Test Symposium (ETS)}, -pages={1--6}, -year={2023}, -organization={IEEE} +@inproceedings{chen2020tensorfi, + author = {Chen, Zitao and Narayanan, Niranjhana and Fang, Bo and Li, Guanpeng and Pattabiraman, Karthik and DeBardeleben, Nathan}, + title = {{TensorFI:} {A} Flexible Fault Injection Framework for {TensorFlow} Applications}, + year = {2020}, + booktitle = {2020 IEEE 31st International Symposium on Software Reliability Engineering (ISSRE)}, + pages = {426--435}, + organization = {IEEE}, + doi = {10.1109/issre5003.2020.00047}, + source = {Crossref}, + url = {https://doi.org/10.1109/issre5003.2020.00047}, + publisher = {IEEE}, + month = oct, } -@inproceedings{zhang2018analyzing, -title={Analyzing and mitigating the impact of permanent faults on a systolic array based neural network accelerator}, -author={Zhang, Jeff Jun and Gu, Tianyu and Basu, Kanad and Garg, Siddharth}, -booktitle={2018 IEEE 36th VLSI Test Symposium (VTS)}, -pages={1--6}, -year={2018}, -organization={IEEE} +@inproceedings{constantinescu2008intermittent, + author = {Constantinescu, Cristian}, + 
title = {Intermittent faults and effects on reliability of integrated circuits}, + year = {2008}, + booktitle = {2008 Annual Reliability and Maintainability Symposium}, + pages = {370--374}, + organization = {IEEE}, + doi = {10.1109/rams.2008.4925824}, + source = {Crossref}, + url = {https://doi.org/10.1109/rams.2008.4925824}, + publisher = {IEEE}, } -@inproceedings{kim2015bamboo, -title={Bamboo ECC: Strong, safe, and flexible codes for reliable computer memory}, -author={Kim, Jungrae and Sullivan, Michael and Erez, Mattan}, -booktitle={2015 IEEE 21st International Symposium on High Performance Computer Architecture (HPCA)}, -pages={101--112}, -year={2015}, -organization={IEEE} +@article{dixit2021silent, + author = {Dixit, Harish Dattatraya and Pendharkar, Sneha and Beadon, Matt and Mason, Chris and Chakravarthy, Tejasvi and Muthiah, Bharath and Sankar, Sriram}, + title = {Silent data corruptions at scale}, + year = {2021}, + journal = {arXiv preprint arXiv:2102.11245}, } @article{egwutuoha2013survey, -title={A survey of fault tolerance mechanisms and checkpoint/restart implementations for high performance computing systems}, -author={Egwutuoha, Ifeanyi P and Levy, David and Selic, Bran and Chen, Shiping}, -journal={The Journal of Supercomputing}, -volume={65}, -pages={1302--1326}, -year={2013}, -publisher={Springer} + author = {Egwutuoha, Ifeanyi P. 
and Levy, David and Selic, Bran and Chen, Shiping}, + title = {A survey of fault tolerance mechanisms and checkpoint/restart implementations for high performance computing systems}, + year = {2013}, + journal = {The Journal of Supercomputing}, + publisher = {Springer Science and Business Media LLC}, + volume = {65}, + pages = {1302--1326}, + doi = {10.1007/s11227-013-0884-0}, + number = {3}, + source = {Crossref}, + url = {https://doi.org/10.1007/s11227-013-0884-0}, + issn = {0920-8542, 1573-0484}, + month = feb, } -@article{rashid2014characterizing, -title={Characterizing the impact of intermittent hardware faults on programs}, -author={Rashid, Layali and Pattabiraman, Karthik and Gopalakrishnan, Sathish}, -journal={IEEE Transactions on Reliability}, -volume={64}, -number={1}, -pages={297--310}, -year={2014}, -publisher={IEEE} +@inproceedings{eisenman2022check, + author = {Eisenman, Assaf and Matam, Kiran Kumar and Ingram, Steven and Mudigere, Dheevatsa and Krishnamoorthi, Raghuraman and Nair, Krishnakumar and Smelyanskiy, Misha and Annavaram, Murali}, + title = {{Check-N-Run}: {A} checkpointing system for training deep learning recommendation models}, + year = {2022}, + booktitle = {19th USENIX Symposium on Networked Systems Design and Implementation (NSDI 22)}, + pages = {929--943}, } -@inproceedings{constantinescu2008intermittent, -title={Intermittent faults and effects on reliability of integrated circuits}, -author={Constantinescu, Cristian}, -booktitle={2008 Annual Reliability and Maintainability Symposium}, -pages={370--374}, -year={2008}, -organization={IEEE} +@inproceedings{francalanza2017foundation, + author = {Francalanza, Adrian and Aceto, Luca and Achilleos, Antonis and Attard, Duncan Paul and Cassar, Ian and Della Monica, Dario and Ing\'olfsd\'ottir, Anna}, + title = {A foundation for runtime monitoring}, + year = {2017}, + booktitle = {International Conference on Runtime Verification}, + pages = {8--29}, + organization = {Springer}, } 
-@inproceedings{zhang2018thundervolt, -title={Thundervolt: enabling aggressive voltage underscaling and timing error resilience for energy efficient deep learning accelerators}, -author={Zhang, Jeff and Rangineni, Kartheek and Ghodsi, Zahra and Garg, Siddharth}, -booktitle={Proceedings of the 55th Annual Design Automation Conference (DAC)}, -pages={1--6}, -year={2018} +@inproceedings{fursov2021adversarial, + author = {Fursov, Ivan and Morozov, Matvey and Kaploukhaya, Nina and Kovtun, Elizaveta and Rivera-Castro, Rodrigo and Gusev, Gleb and Babaev, Dmitry and Kireev, Ivan and Zaytsev, Alexey and Burnaev, Evgeny}, + title = {Adversarial Attacks on Deep Models for Financial Transaction Records}, + year = {2021}, + booktitle = {Proceedings of the 27th ACM SIGKDD Conference on Knowledge Discovery \& Data Mining}, + pages = {2868--2878}, + doi = {10.1145/3447548.3467145}, + source = {Crossref}, + url = {https://doi.org/10.1145/3447548.3467145}, + publisher = {ACM}, + month = aug, } -@inproceedings{he2023understanding, -title={Understanding and mitigating hardware failures in deep learning training systems}, -author={He, Yi and Hutton, Mike and Chan, Steven and De Gruijl, Robert and Govindaraju, Rama and Patil, Nishant and Li, Yanjing}, -booktitle={Proceedings of the 50th Annual International Symposium on Computer Architecture}, -pages={1--16}, -year={2023} +@inproceedings{grafe2023large, + author = {Gr\"afe, Ralf and Sha, Qutub Syed and Geissler, Florian and Paulitsch, Michael}, + title = {Large-Scale Application of Fault Injection into {PyTorch} Models -an Extension to {PyTorchFI} for Validation Efficiency}, + year = {2023}, + booktitle = {2023 53rd Annual IEEE/IFIP International Conference on Dependable Systems and Networks - Supplemental Volume (DSN-S)}, + pages = {56--62}, + organization = {IEEE}, + doi = {10.1109/dsn-s58398.2023.00025}, + source = {Crossref}, + url = {https://doi.org/10.1109/dsn-s58398.2023.00025}, + publisher = {IEEE}, + month = jun, } 
-@inproceedings{rashid2012intermittent, -title={Intermittent hardware errors recovery: Modeling and evaluation}, -author={Rashid, Layali and Pattabiraman, Karthik and Gopalakrishnan, Sathish}, -booktitle={2012 Ninth International Conference on Quantitative Evaluation of Systems}, -pages={220--229}, -year={2012}, -organization={IEEE} +@inproceedings{guo2019simple, + author = {Guo, Chuan and Gardner, Jacob and You, Yurong and Wilson, Andrew Gordon and Weinberger, Kilian}, + title = {Simple black-box adversarial attacks}, + year = {2019}, + booktitle = {International conference on machine learning}, + pages = {2484--2493}, + organization = {PMLR}, } -@article{bushnell2002built, -title={Built-in self-test}, -author={Bushnell, Michael L and Agrawal, Vishwani D}, -journal={Essentials of electronic testing for digital, memory and mixed-signal VLSI circuits}, -pages={489--548}, -year={2002}, -publisher={Springer} +@article{hamming1950error, + author = {Hamming, R. W.}, + title = {Error Detecting and Error Correcting Codes}, + year = {1950}, + journal = {Bell Syst. Tech. 
J.}, + publisher = {Institute of Electrical and Electronics Engineers (IEEE)}, + volume = {29}, + number = {2}, + pages = {147--160}, + doi = {10.1002/j.1538-7305.1950.tb00463.x}, + source = {Crossref}, + url = {https://doi.org/10.1002/j.1538-7305.1950.tb00463.x}, + issn = {0005-8580}, + month = apr, } -@article{hamming1950error, -title={Error detecting and error correcting codes}, -author={Hamming, Richard W}, -journal={The Bell system technical journal}, -volume={29}, -number={2}, -pages={147--160}, -year={1950}, -publisher={Nokia Bell Labs} +@inproceedings{he2020fidelity, + author = {He, Yi and Balaprakash, Prasanna and Li, Yanjing}, + title = {{FIdelity:} {Efficient} Resilience Analysis Framework for Deep Learning Accelerators}, + year = {2020}, + booktitle = {2020 53rd Annual IEEE/ACM International Symposium on Microarchitecture (MICRO)}, + pages = {270--281}, + organization = {IEEE}, + doi = {10.1109/micro50266.2020.00033}, + source = {Crossref}, + url = {https://doi.org/10.1109/micro50266.2020.00033}, + publisher = {IEEE}, + month = oct, } -@inproceedings{sheaffer2007hardware, -title={A hardware redundancy and recovery mechanism for reliable scientific computation on graphics processors}, -author={Sheaffer, Jeremy W and Luebke, David P and Skadron, Kevin}, -booktitle={Graphics Hardware}, -volume={2007}, -pages={55--64}, -year={2007}, -organization={Citeseer} +@inproceedings{he2023understanding, + author = {He, Yi and Hutton, Mike and Chan, Steven and De Gruijl, Robert and Govindaraju, Rama and Patil, Nishant and Li, Yanjing}, + title = {Understanding and Mitigating Hardware Failures in Deep Learning Training Systems}, + year = {2023}, + booktitle = {Proceedings of the 50th Annual International Symposium on Computer Architecture}, + pages = {1--16}, + doi = {10.1145/3579371.3589105}, + source = {Crossref}, + url = {https://doi.org/10.1145/3579371.3589105}, + publisher = {ACM}, + month = jun, } -@article{arifeen2020approximate, -title={Approximate triple 
modular redundancy: A survey}, -author={Arifeen, Tooba and Hassan, Abdus Sami and Lee, Jeong-A}, -journal={IEEE Access}, -volume={8}, -pages={139851--139867}, -year={2020}, -publisher={IEEE} +@article{hendrycks2019benchmarking, + author = {Hendrycks, Dan and Dietterich, Thomas}, + title = {Benchmarking neural network robustness to common corruptions and perturbations}, + year = {2019}, + journal = {arXiv preprint arXiv:1903.12261}, } -@inproceedings{yeh1996triple, -title={Triple-triple redundant 777 primary flight computer}, -author={Yeh, Ying C}, -booktitle={1996 IEEE Aerospace Applications Conference. Proceedings}, -volume={1}, -pages={293--307}, -year={1996}, -organization={IEEE} +@inproceedings{hong2019terminal, + author = {Hong, Sanghyun and Frigo, Pietro and Kaya, Yi{\u{g}}itcan and Giuffrida, Cristiano and Dumitra{\c{s}}, Tudor}, + title = {Terminal brain damage: {Exposing} the graceless degradation in deep neural networks under hardware fault attacks}, + year = {2019}, + booktitle = {28th USENIX Security Symposium (USENIX Security 19)}, + pages = {497--514}, } -@inproceedings{bannon2019computer, -title={Computer and redundancy solution for the full self-driving computer}, -author={Bannon, Pete and Venkataramanan, Ganesh and Sarma, Debjit Das and Talpes, Emil}, -booktitle={2019 IEEE Hot Chips 31 Symposium (HCS)}, -pages={1--22}, -year={2019}, -organization={IEEE Computer Society} +@inproceedings{hsiao2023mavfi, + author = {Hsiao, Yu-Shun and Wan, Zishen and Jia, Tianyu and Ghosal, Radhika and Mahmoud, Abdulrahman and Raychowdhury, Arijit and Brooks, David and Wei, Gu-Yeon and Reddi, Vijay Janapa}, + title = {{MAVFI:} {An} End-to-End Fault Analysis Framework with Anomaly Detection and Recovery for Micro Aerial Vehicles}, + year = {2023}, + booktitle = {2023 Design, Automation \& Test in Europe Conference \& Exhibition (DATE)}, + pages = {1--6}, + organization = {IEEE}, + doi = {10.23919/date56975.2023.10137246}, + source = {Crossref}, + url = 
{https://doi.org/10.23919/date56975.2023.10137246}, + publisher = {IEEE}, + month = apr, } -@inproceedings{pont2002using, -title={Using watchdog timers to improve the reliability of single-processor embedded systems: Seven new patterns and a case study}, -author={Pont, Michael J and Ong, Royan HL}, -booktitle={Proceedings of the First Nordic Conference on Pattern Languages of Programs}, -pages={159--200}, -year={2002}, -organization={Citeseer} +@article{hsiao2023silent, + author = {Hsiao, Yu-Shun and Wan, Zishen and Jia, Tianyu and Ghosal, Radhika and Mahmoud, Abdulrahman and Raychowdhury, Arijit and Brooks, David and Wei, Gu-Yeon and Reddi, Vijay Janapa}, + title = {Silent Data Corruption in Robot Operating System: {A} Case for End-to-End System-Level Fault Analysis Using Autonomous {UAVs}}, + year = {2024}, + journal = {IEEE Trans. Comput. Aided Des. Integr. Circuits Syst.}, + publisher = {Institute of Electrical and Electronics Engineers (IEEE)}, + doi = {10.1109/tcad.2023.3332293}, + number = {4}, + source = {Crossref}, + url = {https://doi.org/10.1109/tcad.2023.3332293}, + volume = {43}, + issn = {0278-0070, 1937-4151}, + pages = {1037--1050}, + month = apr, } -@inproceedings{francalanza2017foundation, -title={A foundation for runtime monitoring}, -author={Francalanza, Adrian and Aceto, Luca and Achilleos, Antonis and Attard, Duncan Paul and Cassar, Ian and Della Monica, Dario and Ing{\'o}lfsd{\'o}ttir, Anna}, -booktitle={International Conference on Runtime Verification}, -pages={8--29}, -year={2017}, -organization={Springer} +@inproceedings{jha2019ml, + author = {Jha, Saurabh and Banerjee, Subho and Tsai, Timothy and Hari, Siva K. S. and Sullivan, Michael B. and Kalbarczyk, Zbigniew T. and Keckler, Stephen W. 
and Iyer, Ravishankar K.}, + title = {{ML}-Based Fault Injection for Autonomous Vehicles: {A} Case for {Bayesian} Fault Injection}, + year = {2019}, + booktitle = {2019 49th Annual IEEE/IFIP International Conference on Dependable Systems and Networks (DSN)}, + pages = {112--124}, + organization = {IEEE}, + doi = {10.1109/dsn.2019.00025}, + source = {Crossref}, + url = {https://doi.org/10.1109/dsn.2019.00025}, + publisher = {IEEE}, + month = jun, } -@article{chandola2009anomaly, -title={Anomaly detection: A survey}, -author={Chandola, Varun and Banerjee, Arindam and Kumar, Vipin}, -journal={ACM computing surveys (CSUR)}, -volume={41}, -number={3}, -pages={1--58}, -year={2009}, -publisher={ACM New York, NY, USA} +@inproceedings{kawazoe1997heartbeat, + author = {Kawazoe Aguilera, Marcos and Chen, Wei and Toueg, Sam}, + title = {Heartbeat: {A} timeout-free failure detector for quiescent reliable communication}, + year = {1997}, + booktitle = {Distributed Algorithms: 11th International Workshop, WDAG'97 Saarbr\"ucken, Germany, September 24{\textendash}26, 1997 Proceedings 11}, + pages = {126--140}, + organization = {Springer}, } -@article{lindholm2019data, -title={Data consistency approach to model validation}, -author={Lindholm, Andreas and Zachariah, Dave and Stoica, Petre and Sch{\"o}n, Thomas B}, -journal={IEEE Access}, -volume={7}, -pages={59788--59796}, -year={2019}, -publisher={IEEE} +@inproceedings{kim2015bamboo, + author = {Kim, Jungrae and Sullivan, Michael and Erez, Mattan}, + title = {Bamboo {ECC:} {Strong,} safe, and flexible codes for reliable computer memory}, + year = {2015}, + booktitle = {2015 IEEE 21st International Symposium on High Performance Computer Architecture (HPCA)}, + pages = {101--112}, + organization = {IEEE}, + doi = {10.1109/hpca.2015.7056025}, + source = {Crossref}, + url = {https://doi.org/10.1109/hpca.2015.7056025}, + publisher = {IEEE}, + month = feb, } -@inproceedings{wan2023vpp, -title={Vpp: The vulnerability-proportional 
protection paradigm towards reliable autonomous machines}, -author={Wan, Zishen and Gan, Yiming and Yu, Bo and Liu, S and Raychowdhury, A and Zhu, Y}, -booktitle={Proceedings of the 5th International Workshop on Domain Specific System Architecture (DOSSA)}, -pages={1--6}, -year={2023} +@article{kirkpatrick2017overcoming, + author = {Kirkpatrick, James and Pascanu, Razvan and Rabinowitz, Neil and Veness, Joel and Desjardins, Guillaume and Rusu, Andrei A. and Milan, Kieran and Quan, John and Ramalho, Tiago and Grabska-Barwinska, Agnieszka and Hassabis, Demis and Clopath, Claudia and Kumaran, Dharshan and Hadsell, Raia}, + title = {Overcoming catastrophic forgetting in neural networks}, + year = {2017}, + journal = {Proc. Natl. Acad. Sci.}, + publisher = {Proceedings of the National Academy of Sciences}, + volume = {114}, + number = {13}, + pages = {3521--3526}, + doi = {10.1073/pnas.1611835114}, + source = {Crossref}, + url = {https://doi.org/10.1073/pnas.1611835114}, + issn = {0027-8424, 1091-6490}, + month = mar, } -@inproceedings{kawazoe1997heartbeat, -title={Heartbeat: A timeout-free failure detector for quiescent reliable communication}, -author={Kawazoe Aguilera, Marcos and Chen, Wei and Toueg, Sam}, -booktitle={Distributed Algorithms: 11th International Workshop, WDAG'97 Saarbr{\"u}cken, Germany, September 24--26, 1997 Proceedings 11}, -pages={126--140}, -year={1997}, -organization={Springer} +@article{ko2021characterizing, + author = {Ko, Yohan}, + title = {Characterizing System-Level Masking Effects against Soft Errors}, + year = {2021}, + journal = {Electronics}, + publisher = {MDPI AG}, + volume = {10}, + number = {18}, + pages = {2286}, + doi = {10.3390/electronics10182286}, + source = {Crossref}, + url = {https://doi.org/10.3390/electronics10182286}, + issn = {2079-9292}, + month = sep, } -@inproceedings{reis2005swift, -title={SWIFT: Software implemented fault tolerance}, -author={Reis, George A and Chang, Jonathan and Vachharajani, Neil and Rangan, Ram 
and August, David I}, -booktitle={International symposium on Code generation and optimization}, -pages={243--254}, -year={2005}, -organization={IEEE} +@article{lee2022design, + author = {Lee, Minwoong and Lee, Namho and Gwon, Huijeong and Kim, Jongyeol and Hwang, Younggwan and Cho, Seongik}, + title = {Design of Radiation-Tolerant High-Speed Signal Processing Circuit for Detecting Prompt Gamma Rays by Nuclear Explosion}, + year = {2022}, + journal = {Electronics}, + publisher = {MDPI AG}, + volume = {11}, + number = {18}, + pages = {2970}, + doi = {10.3390/electronics11182970}, + source = {Crossref}, + url = {https://doi.org/10.3390/electronics11182970}, + issn = {2079-9292}, + month = sep, } -@article{plank1997tutorial, -title={A tutorial on Reed--Solomon coding for fault-tolerance in RAID-like systems}, -author={Plank, James S}, -journal={Software: Practice and Experience}, -volume={27}, -number={9}, -pages={995--1012}, -year={1997}, -publisher={Wiley Online Library} +@inproceedings{li2017understanding, + author = {Li, Guanpeng and Hari, Siva Kumar Sastry and Sullivan, Michael and Tsai, Timothy and Pattabiraman, Karthik and Emer, Joel and Keckler, Stephen W.}, + title = {Understanding error propagation in deep learning neural network {(DNN)} accelerators and applications}, + year = {2017}, + booktitle = {Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis}, + pages = {1--12}, + doi = {10.1145/3126908.3126964}, + source = {Crossref}, + url = {https://doi.org/10.1145/3126908.3126964}, + publisher = {ACM}, + month = nov, } -@article{ye2021thundernna, -title={Thundernna: a white box adversarial attack}, -author={Ye, Linfeng and Hamidi, Shayan Mohajer}, -journal={arXiv preprint arXiv:2111.12305}, -year={2021} +@article{li2021survey, + author = {Li, Qinbin and Wen, Zeyi and Wu, Zhaomin and Hu, Sixu and Wang, Naibo and Li, Yuan and Liu, Xu and He, Bingsheng}, + title = {A Survey on Federated Learning Systems: 
{Vision,} Hype and Reality for Data Privacy and Protection}, + year = {2023}, + journal = {IEEE Trans. Knowl. Data Eng.}, + publisher = {Institute of Electrical and Electronics Engineers (IEEE)}, + volume = {35}, + number = {4}, + pages = {3347--3366}, + doi = {10.1109/tkde.2021.3124599}, + source = {Crossref}, + url = {https://doi.org/10.1109/tkde.2021.3124599}, + issn = {1041-4347, 1558-2191, 2326-3865}, + month = apr, } -@inproceedings{guo2019simple, -title={Simple black-box adversarial attacks}, -author={Guo, Chuan and Gardner, Jacob and You, Yurong and Wilson, Andrew Gordon and Weinberger, Kilian}, -booktitle={International conference on machine learning}, -pages={2484--2493}, -year={2019}, -organization={PMLR} +@article{lindholm2019data, + author = {Lindholm, Andreas and Zachariah, Dave and Stoica, Petre and Sch{\"o}n, Thomas B.}, + title = {Data Consistency Approach to Model Validation}, + year = {2019}, + journal = {IEEE Access}, + publisher = {Institute of Electrical and Electronics Engineers (IEEE)}, + volume = {7}, + pages = {59788--59796}, + doi = {10.1109/access.2019.2915109}, + source = {Crossref}, + url = {https://doi.org/10.1109/access.2019.2915109}, + issn = {2169-3536}, } -@article{xu2021grey, -title={Grey-box adversarial attack and defence for sentiment classification}, -author={Xu, Ying and Zhong, Xu and Yepes, Antonio Jimeno and Lau, Jey Han}, -journal={arXiv preprint arXiv:2103.11576}, -year={2021} +@article{lopez2017gradient, + author = {Lopez-Paz, David and Ranzato, Marc'Aurelio}, + title = {Gradient episodic memory for continual learning}, + year = {2017}, + journal = {Adv Neural Inf Process Syst}, + volume = {30}, } -@inproceedings{carlini2017towards, -title={Towards evaluating the robustness of neural networks}, -author={Carlini, Nicholas and Wagner, David}, -booktitle={2017 ieee symposium on security and privacy (sp)}, -pages={39--57}, -year={2017}, -organization={Ieee} +@article{lowe2020gem5, + author = {Lowe-Power, Jason and Ahmad, 
Abdul Mutaal and Akram, Ayaz and Alian, Mohammad and Amslinger, Rico and Andreozzi, Matteo and Armejach, Adri\`a and Asmussen, Nils and Beckmann, Brad and Bharadwaj, Srikant and others}, + title = {The gem5 simulator: {Version} 20.0+}, + year = {2020}, + journal = {arXiv preprint arXiv:2007.03152}, } -@article{tsai2023adversarial, -title={Adversarial Attacks on Medical Image Classification}, -author={Tsai, Min-Jen and Lin, Ping-Yi and Lee, Ming-En}, -journal={Cancers}, -volume={15}, -number={17}, -pages={4228}, -year={2023}, -publisher={MDPI} +@inproceedings{ma2024dr, + author = {Ma, Dongning and Lin, Fred and Desmaison, Alban and Coburn, Joel and Moore, Daniel and Sankar, Sriram and Jiao, Xun}, + title = {{Dr.} {DNA:} {Combating} Silent Data Corruptions in Deep Learning using Distribution of Neuron Activations}, + year = {2024}, + booktitle = {Proceedings of the 29th ACM International Conference on Architectural Support for Programming Languages and Operating Systems, Volume 3}, + pages = {239--252}, + doi = {10.1145/3620666.3651349}, + source = {Crossref}, + url = {https://doi.org/10.1145/3620666.3651349}, + publisher = {ACM}, + month = apr, } -@inproceedings{fursov2021adversarial, -title={Adversarial attacks on deep models for financial transaction records}, -author={Fursov, Ivan and Morozov, Matvey and Kaploukhaya, Nina and Kovtun, Elizaveta and Rivera-Castro, Rodrigo and Gusev, Gleb and Babaev, Dmitry and Kireev, Ivan and Zaytsev, Alexey and Burnaev, Evgeny}, -booktitle={Proceedings of the 27th ACM SIGKDD Conference on Knowledge Discovery \& Data Mining}, -pages={2868--2878}, -year={2021} +@article{maas2008combining, + author = {Maas, Martin and Andersen, David G. and Isard, Michael and Javanmard, Mohammad Mahdi and McKinley, Kathryn S. and Raffel, Colin}, + title = {Combining Machine Learning and Lifetime-Based Resource Management for Memory Allocation and Beyond}, + year = {2024}, + journal = {Commun. 
ACM}, + publisher = {Association for Computing Machinery (ACM)}, + pages = {87--96}, + doi = {10.1145/3611018}, + number = {4}, + source = {Crossref}, + url = {https://doi.org/10.1145/3611018}, + volume = {67}, + issn = {0001-0782, 1557-7317}, + month = mar, } -@article{bai2021recent, -title={Recent advances in adversarial training for adversarial robustness}, -author={Bai, Tao and Luo, Jinqi and Zhao, Jun and Wen, Bihan and Wang, Qian}, -journal={arXiv preprint arXiv:2102.01356}, -year={2021} +@article{madry2017towards, + author = {Madry, Aleksander and Makelov, Aleksandar and Schmidt, Ludwig and Tsipras, Dimitris and Vladu, Adrian}, + title = {Towards deep learning models resistant to adversarial attacks}, + year = {2017}, + journal = {arXiv preprint arXiv:1706.06083}, } -@inproceedings{addepalli2020towards, -title={Towards achieving adversarial robustness by enforcing feature consistency across bit planes}, -author={Addepalli, Sravanti and BS, Vivek and Baburaj, Arya and Sriramanan, Gaurang and Babu, R Venkatesh}, -booktitle={Proceedings of the IEEE/CVF conference on computer vision and pattern recognition}, -pages={1020--1029}, -year={2020} +@inproceedings{mahmoud2020pytorchfi, + author = {Mahmoud, Abdulrahman and Aggarwal, Neeraj and Nobbe, Alex and Vicarte, Jose Rodrigo Sanchez and Adve, Sarita V. and Fletcher, Christopher W. 
and Frosio, Iuri and Hari, Siva Kumar Sastry}, + title = {{PyTorchFI:} {A} Runtime Perturbation Tool for {DNNs}}, + year = {2020}, + booktitle = {2020 50th Annual IEEE/IFIP International Conference on Dependable Systems and Networks Workshops (DSN-W)}, + pages = {25--31}, + organization = {IEEE}, + doi = {10.1109/dsn-w50199.2020.00014}, + source = {Crossref}, + url = {https://doi.org/10.1109/dsn-w50199.2020.00014}, + publisher = {IEEE}, + month = jun, } @article{marulli2022sensitivity, -title={Sensitivity of machine learning approaches to fake and untrusted data in healthcare domain}, -author={Marulli, Fiammetta and Marrone, Stefano and Verde, Laura}, -journal={Journal of Sensor and Actuator Networks}, -volume={11}, -number={2}, -pages={21}, -year={2022}, -publisher={MDPI} + author = {Marulli, Fiammetta and Marrone, Stefano and Verde, Laura}, + title = {Sensitivity of Machine Learning Approaches to Fake and Untrusted Data in Healthcare Domain}, + year = {2022}, + journal = {Journal of Sensor and Actuator Networks}, + publisher = {MDPI AG}, + volume = {11}, + number = {2}, + pages = {21}, + doi = {10.3390/jsan11020021}, + source = {Crossref}, + url = {https://doi.org/10.3390/jsan11020021}, + issn = {2224-2708}, + month = mar, } -@inproceedings{zhou2018learning, -title={Learning rich features for image manipulation detection}, -author={Zhou, Peng and Han, Xintong and Morariu, Vlad I and Davis, Larry S}, -booktitle={Proceedings of the IEEE conference on computer vision and pattern recognition}, -pages={1053--1061}, -year={2018} +@inproceedings{mohanram2003partial, + author = {Mohanram, Kartik and Touba, Nur A.}, + title = {Partial error masking to reduce soft error failure rate in logic circuits}, + year = {2003}, + booktitle = {Proceedings 18th IEEE Symposium on Defect and Fault Tolerance in VLSI Systems}, + pages = {433--440}, + organization = {IEEE}, + doi = {10.1109/dftvs.2003.1250141}, + source = {Crossref}, + url = {https://doi.org/10.1109/dftvs.2003.1250141}, + publisher = {IEEE Comput. 
Soc}, } -@article{carta2020local, -title={A local feature engineering strategy to improve network anomaly detection}, -author={Carta, Salvatore and Podda, Alessandro Sebastian and Recupero, Diego Reforgiato and Saia, Roberto}, -journal={Future Internet}, -volume={12}, -number={10}, -pages={177}, -year={2020}, -publisher={MDPI} +@inproceedings{mukherjee2005soft, + author = {Mukherjee, S.S. and Emer, J. and Reinhardt, S.K.}, + title = {The Soft Error Problem: {An} Architectural Perspective}, + year = {2005}, + booktitle = {11th International Symposium on High-Performance Computer Architecture}, + pages = {243--247}, + organization = {IEEE}, + doi = {10.1109/hpca.2005.37}, + source = {Crossref}, + url = {https://doi.org/10.1109/hpca.2005.37}, + publisher = {IEEE}, } -@article{berger2014kolmogorov, -title={Kolmogorov--smirnov test: Overview}, -author={Berger, Vance W and Zhou, YanYan}, -journal={Wiley statsref: Statistics reference online}, -year={2014}, -publisher={Wiley Online Library} +@article{myllyaho2022misbehaviour, + author = {Myllyaho, Lalli and Raatikainen, Mikko and M\"annist\"o, Tomi and Nurminen, Jukka K. and Mikkonen, Tommi}, + title = {On misbehaviour and fault tolerance in machine learning systems}, + year = {2022}, + journal = {J. Syst. 
Software}, + publisher = {Elsevier BV}, + volume = {183}, + pages = {111096}, + doi = {10.1016/j.jss.2021.111096}, + source = {Crossref}, + url = {https://doi.org/10.1016/j.jss.2021.111096}, + issn = {0164-1212}, + month = jan, } @article{panda2019discretization, -title={Discretization based solutions for secure machine learning against adversarial attacks}, -author={Panda, Priyadarshini and Chakraborty, Indranil and Roy, Kaushik}, -journal={IEEE Access}, -volume={7}, -pages={70157--70168}, -year={2019}, -publisher={IEEE} + author = {Panda, Priyadarshini and Chakraborty, Indranil and Roy, Kaushik}, + title = {Discretization Based Solutions for Secure Machine Learning Against Adversarial Attacks}, + year = {2019}, + journal = {IEEE Access}, + publisher = {Institute of Electrical and Electronics Engineers (IEEE)}, + volume = {7}, + pages = {70157--70168}, + doi = {10.1109/access.2019.2919463}, + source = {Crossref}, + url = {https://doi.org/10.1109/access.2019.2919463}, + issn = {2169-3536}, } -@article{madry2017towards, -title={Towards deep learning models resistant to adversarial attacks}, -author={Madry, Aleksander and Makelov, Aleksandar and Schmidt, Ludwig and Tsipras, Dimitris and Vladu, Adrian}, -journal={arXiv preprint arXiv:1706.06083}, -year={2017} +@inproceedings{papadimitriou2021demystifying, + author = {Papadimitriou, George and Gizopoulos, Dimitris}, + title = {Demystifying the System Vulnerability Stack: {Transient} Fault Effects Across the Layers}, + year = {2021}, + booktitle = {2021 ACM/IEEE 48th Annual International Symposium on Computer Architecture (ISCA)}, + pages = {902--915}, + organization = {IEEE}, + doi = {10.1109/isca52012.2021.00075}, + source = {Crossref}, + url = {https://doi.org/10.1109/isca52012.2021.00075}, + publisher = {IEEE}, + month = jun, } @inproceedings{papernot2016distillation, -title={Distillation as a defense to adversarial perturbations against deep neural networks}, -author={Papernot, Nicolas and McDaniel, Patrick 
and Wu, Xi and Jha, Somesh and Swami, Ananthram}, -booktitle={2016 IEEE symposium on security and privacy (SP)}, -pages={582--597}, -year={2016}, -organization={IEEE} -} - -@article{hendrycks2019benchmarking, -title={Benchmarking neural network robustness to common corruptions and perturbations}, -author={Hendrycks, Dan and Dietterich, Thomas}, -journal={arXiv preprint arXiv:1903.12261}, -year={2019} -} - -@article{beaton1974fitting, -title={The fitting of power series, meaning polynomials, illustrated on band-spectroscopic data}, -author={Beaton, Albert E and Tukey, John W}, -journal={Technometrics}, -volume={16}, -number={2}, -pages={147--185}, -year={1974}, -publisher={Taylor \& Francis} + author = {Papernot, Nicolas and McDaniel, Patrick and Wu, Xi and Jha, Somesh and Swami, Ananthram}, + title = {Distillation as a Defense to Adversarial Perturbations Against Deep Neural Networks}, + year = {2016}, + booktitle = {2016 IEEE Symposium on Security and Privacy (SP)}, + pages = {582--597}, + organization = {IEEE}, + doi = {10.1109/sp.2016.41}, + source = {Crossref}, + url = {https://doi.org/10.1109/sp.2016.41}, + publisher = {IEEE}, + month = may, } -@article{kirkpatrick2017overcoming, -title={Overcoming catastrophic forgetting in neural networks}, -author={Kirkpatrick, James and Pascanu, Razvan and Rabinowitz, Neil and Veness, Joel and Desjardins, Guillaume and Rusu, Andrei A and Milan, Kieran and Quan, John and Ramalho, Tiago and Grabska-Barwinska, Agnieszka and others}, -journal={Proceedings of the national academy of sciences}, -volume={114}, -number={13}, -pages={3521--3526}, -year={2017}, -publisher={National Acad Sciences} -} - -@article{lopez2017gradient, -title={Gradient episodic memory for continual learning}, -author={Lopez-Paz, David and Ranzato, Marc'Aurelio}, -journal={Advances in neural information processing systems}, -volume={30}, -year={2017} +@article{plank1997tutorial, + author = {Plank, James S}, + title = {A tutorial on 
{Reed{\textendash}Solomon} coding for fault-tolerance in {RAID}-like systems}, + year = {1997}, + journal = {Software: Practice and Experience}, + publisher = {Wiley Online Library}, + volume = {27}, + number = {9}, + pages = {995--1012}, } -@article{myllyaho2022misbehaviour, -title={On misbehaviour and fault tolerance in machine learning systems}, -author={Myllyaho, Lalli and Raatikainen, Mikko and M{\"a}nnist{\"o}, Tomi and Nurminen, Jukka K and Mikkonen, Tommi}, -journal={Journal of Systems and Software}, -volume={183}, -pages={111096}, -year={2022}, -publisher={Elsevier} +@inproceedings{pont2002using, + author = {Pont, Michael J and Ong, Royan HL}, + title = {Using watchdog timers to improve the reliability of single-processor embedded systems: {Seven} new patterns and a case study}, + year = {2002}, + booktitle = {Proceedings of the First Nordic Conference on Pattern Languages of Programs}, + pages = {159--200}, + organization = {Citeseer}, } -@article{zhang2008distribution, -title={On the distribution of software faults}, -author={Zhang, Hongyu}, -journal={IEEE Transactions on Software Engineering}, -volume={34}, -number={2}, -pages={301--302}, -year={2008}, -publisher={IEEE} +@inproceedings{rashid2012intermittent, + author = {Rashid, Layali and Pattabiraman, Karthik and Gopalakrishnan, Sathish}, + title = {Intermittent Hardware Errors Recovery: {Modeling} and Evaluation}, + year = {2012}, + booktitle = {2012 Ninth International Conference on Quantitative Evaluation of Systems}, + pages = {220--229}, + organization = {IEEE}, + doi = {10.1109/qest.2012.37}, + source = {Crossref}, + url = {https://doi.org/10.1109/qest.2012.37}, + publisher = {IEEE}, + month = sep, } -@article{maas2008combining, -title={Combining Machine Learning and Lifetime-Based Resource Management for Memory Allocation and Beyond}, -author={Maas, Martin and Andersen, David G and Isard, Michael and Javanmard, Mohammad Mahdi and McKinley, Kathryn S and Raffel, Colin}, -journal={Communications 
of the ACM}, -pages={1--10}, -year={2008}, -publisher={ACM New York, NY} +@article{rashid2014characterizing, + author = {Rashid, Layali and Pattabiraman, Karthik and Gopalakrishnan, Sathish}, + title = {Characterizing the Impact of Intermittent Hardware Faults on Programs}, + year = {2015}, + journal = {IEEE Trans. Reliab.}, + publisher = {Institute of Electrical and Electronics Engineers (IEEE)}, + volume = {64}, + number = {1}, + pages = {297--310}, + doi = {10.1109/tr.2014.2363152}, + source = {Crossref}, + url = {https://doi.org/10.1109/tr.2014.2363152}, + issn = {0018-9529, 1558-1721}, + month = mar, } -@article{li2021survey, -title={A survey on federated learning systems: Vision, hype and reality for data privacy and protection}, -author={Li, Qinbin and Wen, Zeyi and Wu, Zhaomin and Hu, Sixu and Wang, Naibo and Li, Yuan and Liu, Xu and He, Bingsheng}, -journal={IEEE Transactions on Knowledge and Data Engineering}, -volume={35}, -number={4}, -pages={3347--3366}, -year={2021}, -publisher={IEEE} +@inproceedings{reagen2018ares, + author = {Reagen, Brandon and Gupta, Udit and Pentecost, Lillian and Whatmough, Paul and Lee, Sae Kyu and Mulholland, Niamh and Brooks, David and Wei, Gu-Yeon}, + title = {Ares: {A} framework for quantifying the resilience of deep neural networks}, + year = {2018}, + booktitle = {2018 55th ACM/ESDA/IEEE Design Automation Conference (DAC)}, + pages = {1--6}, + doi = {10.1109/dac.2018.8465834}, + source = {Crossref}, + url = {https://doi.org/10.1109/dac.2018.8465834}, + publisher = {IEEE}, + month = jun, } -@inproceedings{eisenman2022check, -title={$\{$Check-N-Run$\}$: A checkpointing system for training deep learning recommendation models}, -author={Eisenman, Assaf and Matam, Kiran Kumar and Ingram, Steven and Mudigere, Dheevatsa and Krishnamoorthi, Raghuraman and Nair, Krishnakumar and Smelyanskiy, Misha and Annavaram, Murali}, -booktitle={19th USENIX Symposium on Networked Systems Design and Implementation (NSDI 22)}, -pages={929--943}, 
-year={2022} +@inproceedings{reis2005swift, + author = {Reis, G.A. and Chang, J. and Vachharajani, N. and Rangan, R. and August, D.I.}, + title = {{SWIFT:} {Software} Implemented Fault Tolerance}, + year = {2005}, + booktitle = {International Symposium on Code Generation and Optimization}, + pages = {243--254}, + organization = {IEEE}, + doi = {10.1109/cgo.2005.34}, + source = {Crossref}, + url = {https://doi.org/10.1109/cgo.2005.34}, + publisher = {IEEE}, } @inproceedings{sangchoolie2017one, -title={One bit is (not) enough: An empirical study of the impact of single and multiple bit-flip errors}, -author={Sangchoolie, Behrooz and Pattabiraman, Karthik and Karlsson, Johan}, -booktitle={2017 47th annual IEEE/IFIP international conference on dependable systems and networks (DSN)}, -pages={97--108}, -year={2017}, -organization={IEEE} -} - -@inproceedings{wilkening2014calculating, -title={Calculating architectural vulnerability factors for spatial multi-bit transient faults}, -author={Wilkening, Mark and Sridharan, Vilas and Li, Si and Previlon, Fritz and Gurumurthi, Sudhanva and Kaeli, David R}, -booktitle={2014 47th Annual IEEE/ACM International Symposium on Microarchitecture}, -pages={293--305}, -year={2014}, -organization={IEEE} -} - -@article{binkert2011gem5, -title={The gem5 simulator}, -author={Binkert, Nathan and Beckmann, Bradford and Black, Gabriel and Reinhardt, Steven K and Saidi, Ali and Basu, Arkaprava and Hestness, Joel and Hower, Derek R and Krishna, Tushar and Sardashti, Somayeh and others}, -journal={ACM SIGARCH computer architecture news}, -volume={39}, -number={2}, -pages={1--7}, -year={2011}, -publisher={ACM New York, NY, USA} -} - -@article{lowe2020gem5, -title={The gem5 simulator: Version 20.0+}, -author={Lowe-Power, Jason and Ahmad, Abdul Mutaal and Akram, Ayaz and Alian, Mohammad and Amslinger, Rico and Andreozzi, Matteo and Armejach, Adri{\`a} and Asmussen, Nils and Beckmann, Brad and Bharadwaj, Srikant and others}, -journal={arXiv preprint 
arXiv:2007.03152}, -year={2020} + author = {Sangchoolie, Behrooz and Pattabiraman, Karthik and Karlsson, Johan}, + title = {One Bit is {(Not)} Enough: {An} Empirical Study of the Impact of Single and Multiple Bit-Flip Errors}, + year = {2017}, + booktitle = {2017 47th Annual IEEE/IFIP International Conference on Dependable Systems and Networks (DSN)}, + pages = {97--108}, + organization = {IEEE}, + doi = {10.1109/dsn.2017.30}, + source = {Crossref}, + url = {https://doi.org/10.1109/dsn.2017.30}, + publisher = {IEEE}, + month = jun, } -@inproceedings{sangchoolie2017one, -title={One bit is (not) enough: An empirical study of the impact of single and multiple bit-flip errors}, -author={Sangchoolie, Behrooz and Pattabiraman, Karthik and Karlsson, Johan}, -booktitle={2017 47th annual IEEE/IFIP international conference on dependable systems and networks (DSN)}, -pages={97--108}, -year={2017}, -organization={IEEE} +@inproceedings{seong2010safer, + author = {Seong, Nak Hee and Woo, Dong Hyuk and Srinivasan, Vijayalakshmi and Rivers, Jude A. 
and Lee, Hsien-Hsin S.}, + title = {{SAFER:} {Stuck-at-fault} Error Recovery for Memories}, + year = {2010}, + booktitle = {2010 43rd Annual IEEE/ACM International Symposium on Microarchitecture}, + pages = {115--124}, + organization = {IEEE}, + doi = {10.1109/micro.2010.46}, + source = {Crossref}, + url = {https://doi.org/10.1109/micro.2010.46}, + publisher = {IEEE}, + month = dec, } -@inproceedings{papadimitriou2021demystifying, -title={Demystifying the system vulnerability stack: Transient fault effects across the layers}, -author={Papadimitriou, George and Gizopoulos, Dimitris}, -booktitle={2021 ACM/IEEE 48th Annual International Symposium on Computer Architecture (ISCA)}, -pages={902--915}, -year={2021}, -organization={IEEE} +@inproceedings{sheaffer2007hardware, + author = {Sheaffer, Jeremy W and Luebke, David P and Skadron, Kevin}, + title = {A hardware redundancy and recovery mechanism for reliable scientific computation on graphics processors}, + year = {2007}, + booktitle = {Graphics Hardware}, + volume = {2007}, + pages = {55--64}, + organization = {Citeseer}, } -@inproceedings{mohanram2003partial, -title={Partial error masking to reduce soft error failure rate in logic circuits}, -author={Mohanram, Kartik and Touba, Nur A}, -booktitle={Proceedings 18th IEEE Symposium on Defect and Fault Tolerance in VLSI Systems}, -pages={433--440}, -year={2003}, -organization={IEEE} +@inproceedings{tambe2020algorithm, + author = {Tambe, Thierry and Yang, En-Yu and Wan, Zishen and Deng, Yuntian and Janapa Reddi, Vijay and Rush, Alexander and Brooks, David and Wei, Gu-Yeon}, + title = {Algorithm-Hardware Co-Design of Adaptive Floating-Point Encodings for Resilient Deep Learning Inference}, + year = {2020}, + booktitle = {2020 57th ACM/IEEE Design Automation Conference (DAC)}, + pages = {1--6}, + organization = {IEEE}, + doi = {10.1109/dac18072.2020.9218516}, + source = {Crossref}, + url = {https://doi.org/10.1109/dac18072.2020.9218516}, + publisher = {IEEE}, + month = 
jul, } -@article{ko2021characterizing, -title={Characterizing System-Level Masking Effects against Soft Errors}, -author={Ko, Yohan}, -journal={Electronics}, -volume={10}, -number={18}, -pages={2286}, -year={2021}, -publisher={MDPI} +@inproceedings{tsai2021nvbitfi, + author = {Tsai, Timothy and Hari, Siva Kumar Sastry and Sullivan, Michael and Villa, Oreste and Keckler, Stephen W.}, + title = {{NVBitFI:} {Dynamic} Fault Injection for {GPUs}}, + year = {2021}, + booktitle = {2021 51st Annual IEEE/IFIP International Conference on Dependable Systems and Networks (DSN)}, + pages = {284--291}, + organization = {IEEE}, + doi = {10.1109/dsn48987.2021.00041}, + source = {Crossref}, + url = {https://doi.org/10.1109/dsn48987.2021.00041}, + publisher = {IEEE}, + month = jun, } -@article{ahmadilivani2024systematic, -title={A systematic literature review on hardware reliability assessment methods for deep neural networks}, -author={Ahmadilivani, Mohammad Hasan and Taheri, Mahdi and Raik, Jaan and Daneshtalab, Masoud and Jenihhin, Maksim}, -journal={ACM Computing Surveys}, -volume={56}, -number={6}, -pages={1--39}, -year={2024}, -publisher={ACM New York, NY} +@article{tsai2023adversarial, + author = {Tsai, Min-Jen and Lin, Ping-Yi and Lee, Ming-En}, + title = {Adversarial Attacks on Medical Image Classification}, + year = {2023}, + journal = {Cancers}, + publisher = {MDPI AG}, + volume = {15}, + number = {17}, + pages = {4228}, + doi = {10.3390/cancers15174228}, + source = {Crossref}, + url = {https://doi.org/10.3390/cancers15174228}, + issn = {2072-6694}, + month = aug, } @article{velazco2010combining, -title={Combining results of accelerated radiation tests and fault injections to predict the error rate of an application implemented in SRAM-based FPGAs}, -author={Velazco, Raoul and Foucard, Gilles and Peronnard, Paul}, -journal={IEEE Transactions on Nuclear Science}, -volume={57}, -number={6}, -pages={3500--3505}, -year={2010}, -publisher={IEEE} + author = {Velazco, Raoul and 
Foucard, Gilles and Peronnard, Paul}, + title = {Combining Results of Accelerated Radiation Tests and Fault Injections to Predict the Error Rate of an Application Implemented in {SRAM}-Based {FPGAs}}, + year = {2010}, + journal = {IEEE Trans. Nucl. Sci.}, + publisher = {Institute of Electrical and Electronics Engineers (IEEE)}, + volume = {57}, + number = {6}, + pages = {3500--3505}, + doi = {10.1109/tns.2010.2087355}, + source = {Crossref}, + url = {https://doi.org/10.1109/tns.2010.2087355}, + issn = {0018-9499}, + month = dec, } -@article{lee2022design, -title={Design of Radiation-Tolerant High-Speed Signal Processing Circuit for Detecting Prompt Gamma Rays by Nuclear Explosion}, -author={Lee, Minwoong and Lee, Namho and Gwon, Huijeong and Kim, Jongyeol and Hwang, Younggwan and Cho, Seongik}, -journal={Electronics}, -volume={11}, -number={18}, -pages={2970}, -year={2022}, -publisher={MDPI} -} - -@inproceedings{reagen2018ares, -title={Ares: A framework for quantifying the resilience of deep neural networks}, -author={Reagen, Brandon and Gupta, Udit and Pentecost, Lillian and Whatmough, Paul and Lee, Sae Kyu and Mulholland, Niamh and Brooks, David and Wei, Gu-Yeon}, -booktitle={Proceedings of the 55th Annual Design Automation Conference}, -pages={1--6}, -year={2018} +@inproceedings{wan2021analyzing, + author = {Wan, Zishen and Anwar, Aqeel and Hsiao, Yu-Shun and Jia, Tianyu and Reddi, Vijay Janapa and Raychowdhury, Arijit}, + title = {Analyzing and Improving Fault Tolerance of Learning-Based Navigation Systems}, + year = {2021}, + booktitle = {2021 58th ACM/IEEE Design Automation Conference (DAC)}, + pages = {841--846}, + organization = {IEEE}, + doi = {10.1109/dac18074.2021.9586116}, + source = {Crossref}, + url = {https://doi.org/10.1109/dac18074.2021.9586116}, + publisher = {IEEE}, + month = dec, } -@inproceedings{mahmoud2020pytorchfi, -title={Pytorchfi: A runtime perturbation tool for dnns}, -author={Mahmoud, Abdulrahman and Aggarwal, Neeraj and Nobbe, Alex and 
Vicarte, Jose Rodrigo Sanchez and Adve, Sarita V and Fletcher, Christopher W and Frosio, Iuri and Hari, Siva Kumar Sastry}, -booktitle={2020 50th Annual IEEE/IFIP International Conference on Dependable Systems and Networks Workshops (DSN-W)}, -pages={25--31}, -year={2020}, -organization={IEEE} +@inproceedings{wan2023vpp, + author = {Wan, Zishen and Gan, Yiming and Yu, Bo and Liu, S and Raychowdhury, A and Zhu, Y}, + title = {Vpp: {The} vulnerability-proportional protection paradigm towards reliable autonomous machines}, + year = {2023}, + booktitle = {Proceedings of the 5th International Workshop on Domain Specific System Architecture (DOSSA)}, + pages = {1--6}, } -@inproceedings{ma2024dr, -title={Dr. DNA: Combating Silent Data Corruptions in Deep Learning using Distribution of Neuron Activations}, -author={Ma, Dongning and Lin, Fred and Desmaison, Alban and Coburn, Joel and Moore, Daniel and Sankar, Sriram and Jiao, Xun}, -booktitle={Proceedings of the 29th ACM International Conference on Architectural Support for Programming Languages and Operating Systems, Volume 3}, -pages={239--252}, -year={2024} +@inproceedings{wilkening2014calculating, + author = {Wilkening, Mark and Sridharan, Vilas and Li, Si and Previlon, Fritz and Gurumurthi, Sudhanva and Kaeli, David R.}, + title = {Calculating Architectural Vulnerability Factors for Spatial Multi-Bit Transient Faults}, + year = {2014}, + booktitle = {2014 47th Annual IEEE/ACM International Symposium on Microarchitecture}, + pages = {293--305}, + organization = {IEEE}, + doi = {10.1109/micro.2014.15}, + source = {Crossref}, + url = {https://doi.org/10.1109/micro.2014.15}, + publisher = {IEEE}, + month = dec, } -@inproceedings{tambe2020algorithm, -title={Algorithm-hardware co-design of adaptive floating-point encodings for resilient deep learning inference}, -author={Tambe, Thierry and Yang, En-Yu and Wan, Zishen and Deng, Yuntian and Reddi, Vijay Janapa and Rush, Alexander and Brooks, David and Wei, Gu-Yeon}, 
-booktitle={2020 57th ACM/IEEE Design Automation Conference (DAC)}, -pages={1--6}, -year={2020}, -organization={IEEE} +@article{xu2021grey, + author = {Xu, Ying and Zhong, Xu and Yepes, Antonio Jimeno and Lau, Jey Han}, + title = {{Grey}-box adversarial attack and defence for sentiment classification}, + year = {2021}, + journal = {arXiv preprint arXiv:2103.11576}, } -@inproceedings{chen2020tensorfi, -title={Tensorfi: A flexible fault injection framework for tensorflow applications}, -author={Chen, Zitao and Narayanan, Niranjhana and Fang, Bo and Li, Guanpeng and Pattabiraman, Karthik and DeBardeleben, Nathan}, -booktitle={2020 IEEE 31st International Symposium on Software Reliability Engineering (ISSRE)}, -pages={426--435}, -year={2020}, -organization={IEEE} +@article{ye2021thundernna, + author = {Ye, Linfeng and Hamidi, Shayan Mohajer}, + title = {Thundernna: {A} white box adversarial attack}, + year = {2021}, + journal = {arXiv preprint arXiv:2111.12305}, } -@inproceedings{tsai2021nvbitfi, -title={Nvbitfi: Dynamic fault injection for gpus}, -author={Tsai, Timothy and Hari, Siva Kumar Sastry and Sullivan, Michael and Villa, Oreste and Keckler, Stephen W}, -booktitle={2021 51st Annual IEEE/IFIP International Conference on Dependable Systems and Networks (DSN)}, -pages={284--291}, -year={2021}, -organization={IEEE} +@inproceedings{yeh1996triple, + author = {Yeh, Y.C.}, + title = {Triple-triple redundant 777 primary flight computer}, + year = {1996}, + booktitle = {1996 IEEE Aerospace Applications Conference. 
Proceedings}, + volume = {1}, + pages = {293--307}, + organization = {IEEE}, + doi = {10.1109/aero.1996.495891}, + source = {Crossref}, + url = {https://doi.org/10.1109/aero.1996.495891}, + publisher = {IEEE}, } -@inproceedings{jha2019ml, -title={Ml-based fault injection for autonomous vehicles: A case for bayesian fault injection}, -author={Jha, Saurabh and Banerjee, Subho and Tsai, Timothy and Hari, Siva KS and Sullivan, Michael B and Kalbarczyk, Zbigniew T and Keckler, Stephen W and Iyer, Ravishankar K}, -booktitle={2019 49th annual IEEE/IFIP international conference on dependable systems and networks (DSN)}, -pages={112--124}, -year={2019}, -organization={IEEE} +@article{zhang2008distribution, + author = {Zhang, Hongyu}, + title = {On the Distribution of Software Faults}, + year = {2008}, + journal = {IEEE Trans. Software Eng.}, + publisher = {Institute of Electrical and Electronics Engineers (IEEE)}, + volume = {34}, + number = {2}, + pages = {301--302}, + doi = {10.1109/tse.2007.70771}, + source = {Crossref}, + url = {https://doi.org/10.1109/tse.2007.70771}, + issn = {0098-5589}, + month = mar, } -@inproceedings{grafe2023large, -title={Large-scale application of fault injection into pytorch models-an extension to pytorchfi for validation efficiency}, -author={Gr{\"a}fe, Ralf and Sha, Qutub Syed and Geissler, Florian and Paulitsch, Michael}, -booktitle={2023 53rd Annual IEEE/IFIP International Conference on Dependable Systems and Networks-Supplemental Volume (DSN-S)}, -pages={56--62}, -year={2023}, -organization={IEEE} +@inproceedings{zhang2018analyzing, + author = {Zhang, Jeff Jun and Gu, Tianyu and Basu, Kanad and Garg, Siddharth}, + title = {Analyzing and mitigating the impact of permanent faults on a systolic array based neural network accelerator}, + year = {2018}, + booktitle = {2018 IEEE 36th VLSI Test Symposium (VTS)}, + pages = {1--6}, + organization = {IEEE}, + doi = {10.1109/vts.2018.8368656}, + source = {Crossref}, + url = 
{https://doi.org/10.1109/vts.2018.8368656}, + publisher = {IEEE}, + month = apr, } -@inproceedings{hsiao2023mavfi, -title={Mavfi: An end-to-end fault analysis framework with anomaly detection and recovery for micro aerial vehicles}, -author={Hsiao, Yu-Shun and Wan, Zishen and Jia, Tianyu and Ghosal, Radhika and Mahmoud, Abdulrahman and Raychowdhury, Arijit and Brooks, David and Wei, Gu-Yeon and Reddi, Vijay Janapa}, -booktitle={2023 Design, Automation \& Test in Europe Conference \& Exhibition (DATE)}, -pages={1--6}, -year={2023}, -organization={IEEE} +@inproceedings{zhang2018thundervolt, + author = {Zhang, Jeff and Rangineni, Kartheek and Ghodsi, Zahra and Garg, Siddharth}, + title = {{ThUnderVolt:} {Enabling} Aggressive Voltage Underscaling and Timing Error Resilience for Energy Efficient Deep Learning Accelerators}, + year = {2018}, + booktitle = {2018 55th ACM/ESDA/IEEE Design Automation Conference (DAC)}, + pages = {1--6}, + doi = {10.1109/dac.2018.8465918}, + source = {Crossref}, + url = {https://doi.org/10.1109/dac.2018.8465918}, + publisher = {IEEE}, + month = jun, } -@article{bolchini2022fast, -title={Fast and accurate error simulation for cnns against soft errors}, -author={Bolchini, Cristiana and Cassano, Luca and Miele, Antonio and Toschi, Alessandro}, -journal={IEEE Transactions on Computers}, -volume={72}, -number={4}, -pages={984--997}, -year={2022}, -publisher={IEEE} +@inproceedings{zhou2018learning, + author = {Zhou, Peng and Han, Xintong and Morariu, Vlad I. 
and Davis, Larry S.}, + title = {Learning Rich Features for Image Manipulation Detection}, + year = {2018}, + booktitle = {2018 IEEE/CVF Conference on Computer Vision and Pattern Recognition}, + pages = {1053--1061}, + doi = {10.1109/cvpr.2018.00116}, + source = {Crossref}, + url = {https://doi.org/10.1109/cvpr.2018.00116}, + publisher = {IEEE}, + month = jun, } - -@inproceedings{he2020fidelity, -title={Fidelity: Efficient resilience analysis framework for deep learning accelerators}, -author={He, Yi and Balaprakash, Prasanna and Li, Yanjing}, -booktitle={2020 53rd Annual IEEE/ACM International Symposium on Microarchitecture (MICRO)}, -pages={270--281}, -year={2020}, -organization={IEEE} -} \ No newline at end of file