DietCode: Automatic Optimization for Dynamic Tensor Programs
Bojian Zheng, Ziheng Jiang, Cody Hao Yu, Haichen Shen, Josh Fromm, Yizhi Liu, Yida Wang, Luis Ceze, Tianqi Chen, Gennady Pekhimenko
MLSys, August 2022 (To Appear)
Bojian Zheng, Ziheng Jiang, Cody Hao Yu, Haichen Shen, Josh Fromm, Yizhi Liu, Yida Wang, Luis Ceze, Tianqi Chen, Gennady Pekhimenko
MLSys, August 2022 (To Appear)
Roller: Fast and Efficient Tensor Compilation for Deep Learning
Hongyu Zhu, Gennady Pekhimenko et al.
OSDI, July 2022 (To Appear)
Hongyu Zhu, Gennady Pekhimenko et al.
OSDI, July 2022 (To Appear)
% MASc thesis record. Typed as a master's thesis: the article type requires a
% journal field, which a thesis does not have.
% NOTE(review): school is inferred from the cs.toronto.edu URL -- confirm.
% NOTE(review): year is 2021 but the PDF filename ends in 2022 -- confirm.
@mastersthesis{UofTEcoSystem_Yaoyao_Ding_MASc_Thesis,
  author = {Yaoyao Ding},
  title  = {{IOS}: Inter-Operator Scheduler for {CNN} Acceleration},
  school = {University of Toronto},
  year   = {2021},
  url    = {https://www.cs.toronto.edu/ecosystem/papers/Theses/Yaoyao_Ding-MASc_2022.pdf}
}
Benchmarking, Profiling and White-Box Performance Modeling for DNN Training
BibTeX
Hongyu Zhu
PhD Thesis, February 2022
Hongyu Zhu
PhD Thesis, February 2022
% PhD thesis record. Typed as a PhD thesis: the article type requires a
% journal field, which a thesis does not have. The month comes from the
% "PhD Thesis, February 2022" listing line.
% NOTE(review): school is inferred from the cs.toronto.edu URL -- confirm.
@phdthesis{UofTEcoSystem_Hongyu_Zhu_PhD_Thesis,
  author = {Hongyu Zhu},
  title  = {Benchmarking, Profiling and White-Box Performance Modeling for {DNN} Training},
  school = {University of Toronto},
  month  = feb,
  year   = {2022},
  url    = {https://www.cs.toronto.edu/ecosystem/papers/Theses/Hongyu_Zhu-PhD_2022.pdf}
}
Automatic Horizontal Fusion for GPU Kernels
BibTeX
Ao Li, Bojian Zheng, Gennady Pekhimenko, Fan Long
CGO, February 2022
Ao Li, Bojian Zheng, Gennady Pekhimenko, Fan Long
CGO, February 2022
% arXiv (CoRR) preprint record, as exported from dblp.
% NOTE(review): the listing cites CGO, February 2022, while this record
% describes the 2020 arXiv version -- confirm which one should be cited.
@article{UofTEcoSystem_Horizontal_Fusion,
  title      = {Automatic Horizontal Fusion for {GPU} Kernels},
  author     = {Ao Li and Bojian Zheng and Gennady Pekhimenko and Fan Long},
  journal    = {CoRR},
  volume     = {abs/2007.01277},
  year       = {2020},
  eprinttype = {arXiv},
  eprint     = {2007.01277},
  url        = {https://arxiv.org/abs/2007.01277},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2007-01277.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  timestamp  = {Mon, 06 Jul 2020 15:26:01 +0200}
}
Enabling Privacy-Preserving Model Personalization via On-Device Incremental Training
BibTeX
Jiacheng Yang
MASc Thesis, December 2021
Jiacheng Yang
MASc Thesis, December 2021
% MASc thesis record. Typed as a master's thesis: the article type requires a
% journal field, which a thesis does not have. The month comes from the
% "MASc Thesis, December 2021" listing line.
% NOTE(review): school is inferred from the cs.toronto.edu URL -- confirm.
@mastersthesis{UofTEcoSystem_Jiacheng_Yang_MASc_Thesis,
  author = {Jiacheng Yang},
  title  = {Enabling Privacy-Preserving Model Personalization via On-Device Incremental Training},
  school = {University of Toronto},
  month  = dec,
  year   = {2021},
  url    = {https://www.cs.toronto.edu/ecosystem/papers/Theses/Jiacheng_Yang-MASc_2021.pdf}
}
Moshpit SGD: Communication-Efficient Decentralized Training on Heterogeneous Unreliable Devices
BibTeX
Max Ryabinin, Eduard Gorbunov, Vsevolod Plokhotnyuk, Gennady Pekhimenko
NeurIPS, December 2021
Max Ryabinin, Eduard Gorbunov, Vsevolod Plokhotnyuk, Gennady Pekhimenko
NeurIPS, December 2021
% Conference paper (NeurIPS 2021). Typed as inproceedings because the record
% carries a booktitle and no journal; under the article type the venue would
% be dropped and a missing-journal warning raised.
@inproceedings{UofTEcoSystem_Moshpit_SGD,
  author    = {Max Ryabinin and Eduard Gorbunov and Vsevolod Plokhotnyuk and Gennady Pekhimenko},
  title     = {{Moshpit SGD}: Communication-Efficient Decentralized Training on Heterogeneous Unreliable Devices},
  booktitle = {Advances in Neural Information Processing Systems},
  editor    = {A. Beygelzimer and Y. Dauphin and P. Liang and J. Wortman Vaughan},
  year      = {2021},
  url       = {https://openreview.net/forum?id=cwWfDHYpb1z}
}
Distributed Deep Learning In Open Collaborations
BibTeX
Michael Diskin, Alexey Bukhtiyarov, Max Ryabinin, Lucile Saulnier, Quentin Lhoest, Anton Sinitsin, Dmitriy Popov, Dmitry Pyrkin, Maxim Kashirin, Alexander Borzunov, Albert Villanova del Moral, Denis Mazur, Ilia Kobelev, Yacine Jernite, Thomas Wolf, Gennady Pekhimenko
NeurIPS, December 2021
Michael Diskin, Alexey Bukhtiyarov, Max Ryabinin, Lucile Saulnier, Quentin Lhoest, Anton Sinitsin, Dmitriy Popov, Dmitry Pyrkin, Maxim Kashirin, Alexander Borzunov, Albert Villanova del Moral, Denis Mazur, Ilia Kobelev, Yacine Jernite, Thomas Wolf, Gennady Pekhimenko
NeurIPS, December 2021
% Conference paper (NeurIPS 2021). Typed as inproceedings because the record
% carries a booktitle and no journal.
% "Villanova del Moral" is written in "Last, First" form so that the compound
% surname is not split at the lowercase particle "del".
% NOTE(review): the listing spells two authors "Dmitriy Popov" and
% "Dmitry Pyrkin", the reverse of this record -- confirm against the paper.
@inproceedings{UofTEcoSystem_Distrib_Training_in_Open_Collab,
  author    = {Michael Diskin and
               Alexey Bukhtiyarov and
               Max Ryabinin and
               Lucile Saulnier and
               Quentin Lhoest and
               Anton Sinitsin and
               Dmitry Popov and
               Dmitriy Pyrkin and
               Maxim Kashirin and
               Alexander Borzunov and
               Villanova del Moral, Albert and
               Denis Mazur and
               Ilia Kobelev and
               Yacine Jernite and
               Thomas Wolf and
               Gennady Pekhimenko},
  title     = {Distributed Deep Learning In Open Collaborations},
  booktitle = {Advances in Neural Information Processing Systems},
  editor    = {A. Beygelzimer and Y. Dauphin and P. Liang and J. Wortman Vaughan},
  year      = {2021},
  url       = {https://openreview.net/forum?id=FYHktcK-7v}
}
FPRaker: A Processing Element For Accelerating Neural Network Training
BibTeX
Omar Mohamed Awad, Mostafa Mahmoud, Isak Edo, Ali Hadi Zadeh, Ciaran Bannon, Anand Jayarajan, Gennady Pekhimenko, Andreas Moshovos
MICRO, October 2021
Omar Mohamed Awad, Mostafa Mahmoud, Isak Edo, Ali Hadi Zadeh, Ciaran Bannon, Anand Jayarajan, Gennady Pekhimenko, Andreas Moshovos
MICRO, October 2021
% Conference paper (MICRO '21), as exported from dblp.
@inproceedings{UofTEcoSystem_FPRaker,
  title     = {{FPRaker}: A Processing Element For Accelerating Neural Network Training},
  author    = {Omar Mohamed Awad and
               Mostafa Mahmoud and
               Isak Edo and
               Ali Hadi Zadeh and
               Ciaran Bannon and
               Anand Jayarajan and
               Gennady Pekhimenko and
               Andreas Moshovos},
  booktitle = {{MICRO} '21: 54th Annual {IEEE/ACM} International Symposium on Microarchitecture, Virtual Event, Greece, October 18-22, 2021},
  publisher = {{ACM}},
  year      = {2021},
  pages     = {857--869},
  doi       = {10.1145/3466752.3480106},
  url       = {https://doi.org/10.1145/3466752.3480106},
  biburl    = {https://dblp.org/rec/conf/micro/AwadMEZBJPM21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  timestamp = {Tue, 19 Oct 2021 16:42:06 +0200}
}
MedPerf: Open Benchmarking Platform for Medical Artificial Intelligence using Federated Evaluation
BibTeX
Alexandros Karargyris, Renato Umeton, Micah J. Sheller, Alejandro Aristizabal, Johnu George, Srini Bala, Daniel J. Beutel, Victor Bittorf, Akshay Chaudhari, Alexander Chowdhury, Cody Coleman, Bala Desinghu, Gregory Diamos, Debo Dutta, Diane Feddema, Grigori Fursin, Junyi Guo, Xinyuan Huang, David Kanter, Satyananda Kashyap, Nicholas Lane, Indranil Mallick, Pietro Mascagni, Virendra Mehta, Vivek Natarajan, Nikola Nikolov, Nicolas Padoy, Gennady Pekhimenko, Vijay Janapa Reddi, G Anthony Reina, Pablo Ribalta, Jacob Rosenthal, Abhishek Singh, Jayaraman J. Thiagarajan, Anna Wuest, Maria Xenochristou, Daguang Xu, Poonam Yadav, Michael Rosenthal, Massimo Loda, Jason M. Johnson, Peter Mattson
ArXiv, September 2021
Alexandros Karargyris, Renato Umeton, Micah J. Sheller, Alejandro Aristizabal, Johnu George, Srini Bala, Daniel J. Beutel, Victor Bittorf, Akshay Chaudhari, Alexander Chowdhury, Cody Coleman, Bala Desinghu, Gregory Diamos, Debo Dutta, Diane Feddema, Grigori Fursin, Junyi Guo, Xinyuan Huang, David Kanter, Satyananda Kashyap, Nicholas Lane, Indranil Mallick, Pietro Mascagni, Virendra Mehta, Vivek Natarajan, Nikola Nikolov, Nicolas Padoy, Gennady Pekhimenko, Vijay Janapa Reddi, G Anthony Reina, Pablo Ribalta, Jacob Rosenthal, Abhishek Singh, Jayaraman J. Thiagarajan, Anna Wuest, Maria Xenochristou, Daguang Xu, Poonam Yadav, Michael Rosenthal, Massimo Loda, Jason M. Johnson, Peter Mattson
ArXiv, September 2021
% arXiv (CoRR) preprint record, as exported from dblp.
@article{UofTEcoSystem_MedPerf,
  title      = {{MedPerf}: Open Benchmarking Platform for Medical Artificial Intelligence using Federated Evaluation},
  author     = {Alexandros Karargyris and
                Renato Umeton and
                Micah J. Sheller and
                Alejandro Aristizabal and
                Johnu George and
                Srini Bala and
                Daniel J. Beutel and
                Victor Bittorf and
                Akshay Chaudhari and
                Alexander Chowdhury and
                Cody Coleman and
                Bala Desinghu and
                Gregory F. Diamos and
                Debo Dutta and
                Diane Feddema and
                Grigori Fursin and
                Junyi Guo and
                Xinyuan Huang and
                David Kanter and
                Satyananda Kashyap and
                Nicholas D. Lane and
                Indranil Mallick and
                Pietro Mascagni and
                Virendra Mehta and
                Vivek Natarajan and
                Nikola Nikolov and
                Nicolas Padoy and
                Gennady Pekhimenko and
                Vijay Janapa Reddi and
                G. Anthony Reina and
                Pablo Ribalta and
                Jacob Rosenthal and
                Abhishek Singh and
                Jayaraman J. Thiagarajan and
                Anna Wuest and
                Maria Xenochristou and
                Daguang Xu and
                Poonam Yadav and
                Michael Rosenthal and
                Massimo Loda and
                Jason M. Johnson and
                Peter Mattson},
  journal    = {CoRR},
  volume     = {abs/2110.01406},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2110.01406},
  url        = {https://arxiv.org/abs/2110.01406},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2110-01406.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
  timestamp  = {Fri, 08 Oct 2021 15:47:55 +0200}
}
Habitat: A Runtime-Based Computational Performance Predictor for Deep Neural Network Training
BibTeX
Geoffrey X. Yu, Yubo Gao, Pavel Golikov, Gennady Pekhimenko
USENIX ATC, July 2021
Geoffrey X. Yu, Yubo Gao, Pavel Golikov, Gennady Pekhimenko
USENIX ATC, July 2021
% Conference paper (USENIX ATC 2021), as exported from dblp.
@inproceedings{UofTEcoSystem_Habitat,
  title     = {{Habitat}: A Runtime-Based Computational Performance Predictor for Deep Neural Network Training},
  author    = {Geoffrey X. Yu and Yubo Gao and Pavel Golikov and Gennady Pekhimenko},
  booktitle = {2021 {USENIX} Annual Technical Conference, {USENIX} {ATC} 2021, July 14-16, 2021},
  editor    = {Irina Calciu and Geoff Kuenning},
  publisher = {{USENIX} Association},
  year      = {2021},
  pages     = {503--521},
  url       = {https://www.usenix.org/conference/atc21/presentation/yu},
  biburl    = {https://dblp.org/rec/conf/usenix/YuGGP21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  timestamp = {Thu, 12 Aug 2021 18:08:26 +0200}
}
NVOverlay: Enabling Efficient and Scalable High-Frequency Snapshotting to NVM
BibTeX
Ziqi Wang, Chul-Hwan Choo, Michael A. Kozuch, Todd C. Mowry, Gennady Pekhimenko, Vivek Seshadri, Dimitrios Skarlatos
ISCA, June 2021
Ziqi Wang, Chul-Hwan Choo, Michael A. Kozuch, Todd C. Mowry, Gennady Pekhimenko, Vivek Seshadri, Dimitrios Skarlatos
ISCA, June 2021
% Conference paper (ISCA 2021), dblp export. Typed as inproceedings because the
% record carries a booktitle and no journal; under the article type the venue
% would be dropped and a missing-journal warning raised.
@inproceedings{UofTEcoSystem_NVOverlay,
  author    = {Ziqi Wang and
               Chul{-}Hwan Choo and
               Michael A. Kozuch and
               Todd C. Mowry and
               Gennady Pekhimenko and
               Vivek Seshadri and
               Dimitrios Skarlatos},
  title     = {{NVOverlay}: Enabling Efficient and Scalable High-Frequency Snapshotting to {NVM}},
  booktitle = {48th {ACM/IEEE} Annual International Symposium on Computer Architecture, {ISCA} 2021, Valencia, Spain, June 14-18, 2021},
  pages     = {498--511},
  publisher = {{IEEE}},
  year      = {2021},
  url       = {https://doi.org/10.1109/ISCA52012.2021.00046},
  doi       = {10.1109/ISCA52012.2021.00046},
  timestamp = {Thu, 14 Oct 2021 10:17:42 +0200},
  biburl    = {https://dblp.org/rec/conf/isca/WangCKMPS021.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
Horizontally Fused Training Array: An Effective Hardware Utilization Squeezer for Training Novel Deep Learning Models
BibTeX
Shang Wang, Peiming Yang, Yuxuan Zheng, Xin Li, Gennady Pekhimenko
MLSys, April 2021
Shang Wang, Peiming Yang, Yuxuan Zheng, Xin Li, Gennady Pekhimenko
MLSys, April 2021
% Conference paper (Proceedings of Machine Learning and Systems, volume 3).
% Typed as inproceedings because the record carries a booktitle and no journal.
@inproceedings{UofTEcoSystem_HFTA,
  author    = {Shang Wang and
               Peiming Yang and
               Yuxuan Zheng and
               Xin Li and
               Gennady Pekhimenko},
  title     = {Horizontally Fused Training Array: An Effective Hardware Utilization Squeezer for Training Novel Deep Learning Models},
  booktitle = {Proceedings of Machine Learning and Systems},
  editor    = {A. Smola and A. Dimakis and I. Stoica},
  volume    = {3},
  pages     = {599--623},
  year      = {2021},
  url       = {https://proceedings.mlsys.org/paper/2021/file/a97da629b098b75c294dffdc3e463904-Paper.pdf}
}
RL-Scope: Cross-Stack Profiling for Deep Reinforcement Learning Workloads
BibTeX
James Gleeson, Srivatsan Krishnan, Moshe Gabel, Vijay Janapa Reddi, Eyal de Lara, Gennady Pekhimenko
MLSys, April 2021
James Gleeson, Srivatsan Krishnan, Moshe Gabel, Vijay Janapa Reddi, Eyal de Lara, Gennady Pekhimenko
MLSys, April 2021
% Conference paper (Proceedings of Machine Learning and Systems, volume 3).
% Typed as inproceedings because the record carries a booktitle and no journal.
@inproceedings{UofTEcoSystem_RLScope,
  author    = {James Gleeson and
               Srivatsan Krishnan and
               Moshe Gabel and
               Vijay Janapa Reddi and
               Eyal de Lara and
               Gennady Pekhimenko},
  title     = {{RL-Scope}: Cross-stack Profiling for Deep Reinforcement Learning Workloads},
  booktitle = {Proceedings of Machine Learning and Systems},
  editor    = {A. Smola and A. Dimakis and I. Stoica},
  volume    = {3},
  pages     = {783--799},
  year      = {2021},
  url       = {https://proceedings.mlsys.org/paper/2021/file/d1fe173d08e959397adf34b1d77e88d7-Paper.pdf}
}
IOS: Inter-Operator Scheduler for CNN Acceleration
BibTeX
Yaoyao Ding, Ligeng Zhu, Zhihao Jia, Gennady Pekhimenko, Song Han
MLSys, April 2021
Yaoyao Ding, Ligeng Zhu, Zhihao Jia, Gennady Pekhimenko, Song Han
MLSys, April 2021
% Conference paper (Proceedings of Machine Learning and Systems, volume 3).
% Typed as inproceedings because the record carries a booktitle and no journal.
@inproceedings{UofTEcoSystem_IOS,
  author    = {Yaoyao Ding and
               Ligeng Zhu and
               Zhihao Jia and
               Gennady Pekhimenko and
               Song Han},
  title     = {{IOS}: Inter-Operator Scheduler for {CNN} Acceleration},
  booktitle = {Proceedings of Machine Learning and Systems},
  editor    = {A. Smola and A. Dimakis and I. Stoica},
  volume    = {3},
  pages     = {167--180},
  year      = {2021},
  url       = {https://proceedings.mlsys.org/paper/2021/file/38b3eff8baf56627478ec76a704e9b52-Paper.pdf}
}
Boveda: Building an On-Chip Deep Learning Memory Hierarchy Brick by Brick
Isak Edo Vivancos, Sayeh Sharify, Milos Nikolic, Ciaran Bannon, Mostafa Mahmoud, Alberto Delmas Lascorz, Gennady Pekhimenko, Andreas Moshovos
MLSys, April 2021
Isak Edo Vivancos, Sayeh Sharify, Milos Nikolic, Ciaran Bannon, Mostafa Mahmoud, Alberto Delmas Lascorz, Gennady Pekhimenko, Andreas Moshovos
MLSys, April 2021
% Conference paper (Proceedings of Machine Learning and Systems, volume 3).
% Typed as inproceedings because the record carries a booktitle and no journal.
% NOTE(review): this record lists Daniel Ly-Ma and Ameer Abdelhadi, who do not
% appear in the listing's author line -- confirm against the paper.
@inproceedings{UofTEcoSystem_Boveda,
  author    = {Edo Vivancos, Isak and
               Sharify, Sayeh and
               Ly-Ma, Daniel and
               Abdelhadi, Ameer and
               Bannon, Ciaran and
               Nikolic, Milos and
               Mahmoud, Mostafa and
               Delmas Lascorz, Alberto and
               Pekhimenko, Gennady and
               Moshovos, Andreas},
  title     = {{Boveda}: Building an On-Chip Deep Learning Memory Hierarchy Brick by Brick},
  booktitle = {Proceedings of Machine Learning and Systems},
  editor    = {A. Smola and A. Dimakis and I. Stoica},
  volume    = {3},
  pages     = {1--20},
  year      = {2021},
  url       = {https://proceedings.mlsys.org/paper/2021/file/013d407166ec4fa56eb1e1f8cbe183b9-Paper.pdf}
}
LifeStream: A High-performance Stream Processing Engine for Waveform Data
BibTeX
Anand Jayarajan, Kimberly Hau, Andrew Goodwin, Gennady Pekhimenko
ASPLOS, April 2021
Anand Jayarajan, Kimberly Hau, Andrew Goodwin, Gennady Pekhimenko
ASPLOS, April 2021
% Conference paper (ASPLOS '21), dblp export. Typed as inproceedings because
% the record carries a booktitle and no journal.
% NOTE(review): the listing title ends in "for Waveform Data", while this
% record's title ends in "for periodic streams" -- confirm which is intended.
@inproceedings{UofTEcoSystem_LifeStream,
  author    = {Anand Jayarajan and
               Kimberly Hau and
               Andrew Goodwin and
               Gennady Pekhimenko},
  editor    = {Tim Sherwood and
               Emery D. Berger and
               Christos Kozyrakis},
  title     = {{LifeStream}: a high-performance stream processing engine for periodic streams},
  booktitle = {{ASPLOS} '21: 26th {ACM} International Conference on Architectural Support for Programming Languages and Operating Systems, Virtual Event, USA, April 19-23, 2021},
  pages     = {107--122},
  publisher = {{ACM}},
  year      = {2021},
  url       = {https://doi.org/10.1145/3445814.3446725},
  doi       = {10.1145/3445814.3446725},
  timestamp = {Sat, 08 Jan 2022 02:24:44 +0100},
  biburl    = {https://dblp.org/rec/conf/asplos/JayarajanHGP21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
Gretch: A Hardware Prefetcher for Graph Analytics
BibTeX
Anirudh Mohan Kaushik, Gennady Pekhimenko, Hiren Patel
TACO, February 2021
Anirudh Mohan Kaushik, Gennady Pekhimenko, Hiren Patel
TACO, February 2021
% Journal article (TACO, volume 18, number 2).
% The journal field holds the full journal name; the previous value dropped
% the plural and the connecting words. The month uses the standard lowercase
% three-letter macro.
@article{UofTEcoSystem_Gretch,
  author     = {Anirudh Mohan Kaushik and
                Gennady Pekhimenko and
                Hiren Patel},
  title      = {{Gretch}: A Hardware Prefetcher for Graph Analytics},
  journal    = {ACM Transactions on Architecture and Code Optimization},
  volume     = {18},
  number     = {2},
  month      = feb,
  year       = {2021},
  issue_date = {February 2021},
  articleno  = {18},
  numpages   = {25},
  publisher  = {Association for Computing Machinery},
  address    = {New York, NY, USA},
  issn       = {1544-3566},
  url        = {https://doi.org/10.1145/3439803},
  doi        = {10.1145/3439803},
  keywords   = {data-dependent memory accesses, Hardware prefetching, graph analytics}
}
TensorDash: Exploiting Sparsity to Accelerate Deep Neural Network Training
BibTeX
Mostafa Mahmoud, Isak Edo Vivancos, Ali Hadi Zadeh, Omar Mohamed Awad, Gennady Pekhimenko, Jorge Albericio, Andreas Moshovos
MICRO, October 2020
Mostafa Mahmoud, Isak Edo Vivancos, Ali Hadi Zadeh, Omar Mohamed Awad, Gennady Pekhimenko, Jorge Albericio, Andreas Moshovos
MICRO, October 2020
% Conference paper (MICRO 2020), as exported from dblp.
@inproceedings{UofTEcoSystem_TensorDash,
  title     = {{TensorDash}: Exploiting Sparsity to Accelerate Deep Neural Network Training},
  author    = {Mostafa Mahmoud and
               Isak Edo and
               Ali Hadi Zadeh and
               Omar Mohamed Awad and
               Gennady Pekhimenko and
               Jorge Albericio and
               Andreas Moshovos},
  booktitle = {53rd Annual {IEEE/ACM} International Symposium on Microarchitecture, {MICRO} 2020, Athens, Greece, October 17-21, 2020},
  publisher = {{IEEE}},
  year      = {2020},
  pages     = {781--795},
  doi       = {10.1109/MICRO50266.2020.00069},
  url       = {https://doi.org/10.1109/MICRO50266.2020.00069},
  biburl    = {https://dblp.org/rec/conf/micro/MahmoudEZAPAM20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  timestamp = {Tue, 17 Nov 2020 13:33:12 +0100}
}
Skyline: Interactive In-Editor Computational Performance Profiling for Deep Neural Network Training
BibTeX
Geoffrey Yu, Tovi Grossman, Gennady Pekhimenko
UIST, October 2020
Geoffrey Yu, Tovi Grossman, Gennady Pekhimenko
UIST, October 2020
% Conference paper (UIST '20), as exported from dblp.
@inproceedings{UofTEcoSystem_Skyline,
  title     = {{Skyline}: Interactive In-Editor Computational Performance Profiling for Deep Neural Network Training},
  author    = {Geoffrey X. Yu and Tovi Grossman and Gennady Pekhimenko},
  booktitle = {{UIST} '20: The 33rd Annual {ACM} Symposium on User Interface Software and Technology, Virtual Event, USA, October 20-23, 2020},
  editor    = {Shamsi T. Iqbal and
               Karon E. MacLean and
               Fanny Chevalier and
               Stefanie Mueller},
  publisher = {{ACM}},
  year      = {2020},
  pages     = {126--139},
  doi       = {10.1145/3379337.3415890},
  url       = {https://doi.org/10.1145/3379337.3415890},
  biburl    = {https://dblp.org/rec/conf/uist/YuGP20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  timestamp = {Sun, 18 Oct 2020 18:35:39 +0200}
}
Multi-Node Bert-pretraining: Cost-efficient Approach
BibTeX
Jiahuang Lin, Xin Li, Gennady Pekhimenko
arXiv, August 2020
Jiahuang Lin, Xin Li, Gennady Pekhimenko
arXiv, August 2020
% arXiv preprint, identified by its eprint number and primary class.
@misc{UofTEcoSystem_Multi_Node_BERT_Pretraining,
  author        = {Jiahuang Lin and
                   Xin Li and
                   Gennady Pekhimenko},
  title         = {Multi-Node {BERT}-Pretraining: Cost-efficient Approach},
  year          = {2020},
  archivePrefix = {arXiv},
  eprint        = {2008.00177},
  primaryClass  = {cs.LG}
}
Daydream: Accurately Estimating the Efficacy of Optimizations for DNN Training
BibTeX
Hongyu Zhu, Amar Phanishayee, Gennady Pekhimenko
USENIX ATC, July 2020
Hongyu Zhu, Amar Phanishayee, Gennady Pekhimenko
USENIX ATC, July 2020
% Conference paper (USENIX ATC 2020), as exported from dblp.
@inproceedings{UofTEcoSystem_Daydream,
  title     = {{Daydream}: Accurately Estimating the Efficacy of Optimizations for {DNN} Training},
  author    = {Hongyu Zhu and Amar Phanishayee and Gennady Pekhimenko},
  booktitle = {2020 {USENIX} Annual Technical Conference, {USENIX} {ATC} 2020, July 15-17, 2020},
  editor    = {Ada Gavrilovska and Erez Zadok},
  publisher = {{USENIX} Association},
  year      = {2020},
  pages     = {337--352},
  url       = {https://www.usenix.org/conference/atc20/presentation/zhu-hongyu},
  biburl    = {https://dblp.org/rec/conf/usenix/ZhuPP20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  timestamp = {Mon, 01 Feb 2021 08:43:50 +0100}
}
Echo: Compiler-based GPU Memory Footprint Reduction for LSTM RNN Training
BibTeX
Bojian Zheng, Abhishek Tiwari, Nandita Vijaykumar, Gennady Pekhimenko
ISCA, June 2020
Bojian Zheng, Abhishek Tiwari, Nandita Vijaykumar, Gennady Pekhimenko
ISCA, June 2020
% Conference paper (ISCA 2020), as exported from dblp.
% NOTE(review): the listing also names Abhishek Tiwari as an author; this
% record has three authors -- confirm against the paper.
@inproceedings{UofTEcoSystem_Echo,
  title     = {{Echo}: Compiler-based {GPU} Memory Footprint Reduction for {LSTM} {RNN} Training},
  author    = {Bojian Zheng and Nandita Vijaykumar and Gennady Pekhimenko},
  booktitle = {47th {ACM/IEEE} Annual International Symposium on Computer Architecture, {ISCA} 2020, Valencia, Spain, May 30 - June 3, 2020},
  publisher = {{IEEE}},
  year      = {2020},
  pages     = {1089--1102},
  doi       = {10.1109/ISCA45697.2020.00092},
  url       = {https://doi.org/10.1109/ISCA45697.2020.00092},
  biburl    = {https://dblp.org/rec/conf/isca/ZhengVP20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  timestamp = {Wed, 22 Jul 2020 15:50:37 +0200}
}
MLPerf Inference Benchmark
BibTeX
Vijay Janapa Reddi, Christine Cheng, David Kanter, Peter Mattson, Guenther Schmuelling, Carole-Jean Wu, Brian Anderson, Maximilien Breughe, Mark Charlebois, William Chou, Ramesh Chukka, Cody Coleman, Sam Davis, Pan Deng, Greg Diamos, Jared Duke, Dave Fick, J. Scott Gardner, Itay Hubara, Sachin Idgunji, Thomas B. Jablin, Jeff Jiao, Tom St. John, Pankaj Kanwar, David Lee, Jeffery Liao, Anton Lokhmotov, Francisco Massa, Peng Meng, Paulius Micikevicius, Colin Osborne, Gennady Pekhimenko, Arun Tejusve Raghunath Rajan, Dilip Sequeira, Ashish Sirasao, Fei Sun, Hanlin Tang, Michael Thomson, Frank Wei, Ephrem Wu, Lingjie Xu, Koichi Yamada, Bing Yu, George Yuan, Aaron Zhong, Peizhao Zhang, Yuchen Zhou
ISCA, June 2020
MICRO Top Picks
Vijay Janapa Reddi, Christine Cheng, David Kanter, Peter Mattson, Guenther Schmuelling, Carole-Jean Wu, Brian Anderson, Maximilien Breughe, Mark Charlebois, William Chou, Ramesh Chukka, Cody Coleman, Sam Davis, Pan Deng, Greg Diamos, Jared Duke, Dave Fick, J. Scott Gardner, Itay Hubara, Sachin Idgunji, Thomas B. Jablin, Jeff Jiao, Tom St. John, Pankaj Kanwar, David Lee, Jeffery Liao, Anton Lokhmotov, Francisco Massa, Peng Meng, Paulius Micikevicius, Colin Osborne, Gennady Pekhimenko, Arun Tejusve Raghunath Rajan, Dilip Sequeira, Ashish Sirasao, Fei Sun, Hanlin Tang, Michael Thomson, Frank Wei, Ephrem Wu, Lingjie Xu, Koichi Yamada, Bing Yu, George Yuan, Aaron Zhong, Peizhao Zhang, Yuchen Zhou
ISCA, June 2020
MICRO Top Picks
% Conference paper (ISCA 2020), dblp export.
% "MLPerf" is brace-protected in the title so that styles applying sentence
% casing keep its capitalization.
@inproceedings{UofTEcoSystem_MLPerf_Inference,
  author    = {Vijay Janapa Reddi and
               Christine Cheng and
               David Kanter and
               Peter Mattson and
               Guenther Schmuelling and
               Carole{-}Jean Wu and
               Brian Anderson and
               Maximilien Breughe and
               Mark Charlebois and
               William Chou and
               Ramesh Chukka and
               Cody Coleman and
               Sam Davis and
               Pan Deng and
               Greg Diamos and
               Jared Duke and
               Dave Fick and
               J. Scott Gardner and
               Itay Hubara and
               Sachin Idgunji and
               Thomas B. Jablin and
               Jeff Jiao and
               Tom St. John and
               Pankaj Kanwar and
               David Lee and
               Jeffery Liao and
               Anton Lokhmotov and
               Francisco Massa and
               Peng Meng and
               Paulius Micikevicius and
               Colin Osborne and
               Gennady Pekhimenko and
               Arun Tejusve Raghunath Rajan and
               Dilip Sequeira and
               Ashish Sirasao and
               Fei Sun and
               Hanlin Tang and
               Michael Thomson and
               Frank Wei and
               Ephrem Wu and
               Lingjie Xu and
               Koichi Yamada and
               Bing Yu and
               George Yuan and
               Aaron Zhong and
               Peizhao Zhang and
               Yuchen Zhou},
  title     = {{MLPerf} Inference Benchmark},
  booktitle = {47th {ACM/IEEE} Annual International Symposium on Computer Architecture, {ISCA} 2020, Valencia, Spain, May 30 - June 3, 2020},
  pages     = {446--459},
  publisher = {{IEEE}},
  year      = {2020},
  url       = {https://doi.org/10.1109/ISCA45697.2020.00045},
  doi       = {10.1109/ISCA45697.2020.00045},
  timestamp = {Wed, 22 Jul 2020 15:50:37 +0200},
  biburl    = {https://dblp.org/rec/conf/isca/ReddiCKMSWABCCC20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
BPPSA: Scaling Back-propagation by Parallel Scan Algorithm
BibTeX
Shang Wang, Yifan Bai, Gennady Pekhimenko
MLSys, March 2020
Shang Wang, Yifan Bai, Gennady Pekhimenko
MLSys, March 2020
% Conference paper (MLSys 2020), as exported from dblp.
@inproceedings{UofTEcoSystem_BPPSA,
  title     = {{BPPSA}: Scaling Back-propagation by Parallel Scan Algorithm},
  author    = {Shang Wang and Yifan Bai and Gennady Pekhimenko},
  booktitle = {Proceedings of Machine Learning and Systems 2020, MLSys 2020, Austin, TX, USA, March 2-4, 2020},
  editor    = {Inderjit S. Dhillon and
               Dimitris S. Papailiopoulos and
               Vivienne Sze},
  publisher = {mlsys.org},
  year      = {2020},
  url       = {https://proceedings.mlsys.org/book/317.pdf},
  biburl    = {https://dblp.org/rec/conf/mlsys/0002BP20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  timestamp = {Thu, 18 Jun 2020 15:48:04 +0200}
}
MLPerf Training Benchmark
BibTeX
Peter Mattson, Christine Cheng, Cody Coleman, Greg Diamos, Paulius Micikevicius, David Patterson, Hanlin Tang, Gu-Yeon Wei, Peter Bailis, Victor Bittorf, David Brooks, Dehao Chen, Debojyoti Dutta, Udit Gupta, Kim Hazelwood, Andrew Hock, Xinyuan Huang, Bill Jia, Daniel Kang, David Kanter, Naveen Kumar, Jeffery Liao, Deepak Narayanan, Tayo Oguntebi, Gennady Pekhimenko, Lillian Pentecost, Vijay Janapa Reddi, Taylor Robie, Tom St. John, Carole-Jean Wu, Lingjie Xu, Cliff Young, Matei Zaharia
MLSys, March 2020
Peter Mattson, Christine Cheng, Cody Coleman, Greg Diamos, Paulius Micikevicius, David Patterson, Hanlin Tang, Gu-Yeon Wei, Peter Bailis, Victor Bittorf, David Brooks, Dehao Chen, Debojyoti Dutta, Udit Gupta, Kim Hazelwood, Andrew Hock, Xinyuan Huang, Bill Jia, Daniel Kang, David Kanter, Naveen Kumar, Jeffery Liao, Deepak Narayanan, Tayo Oguntebi, Gennady Pekhimenko, Lillian Pentecost, Vijay Janapa Reddi, Taylor Robie, Tom St. John, Carole-Jean Wu, Lingjie Xu, Cliff Young, Matei Zaharia
MLSys, March 2020
% Conference paper (MLSys 2020), dblp export.
% "MLPerf" is brace-protected in the title so that styles applying sentence
% casing keep its capitalization.
% NOTE(review): the listing's author line includes "Bill Jia", who is not in
% this record -- confirm against the paper.
@inproceedings{UofTEcoSystem_MLPerf_Training,
  author    = {Peter Mattson and
               Christine Cheng and
               Gregory F. Diamos and
               Cody Coleman and
               Paulius Micikevicius and
               David A. Patterson and
               Hanlin Tang and
               Gu{-}Yeon Wei and
               Peter Bailis and
               Victor Bittorf and
               David Brooks and
               Dehao Chen and
               Debo Dutta and
               Udit Gupta and
               Kim M. Hazelwood and
               Andy Hock and
               Xinyuan Huang and
               Daniel Kang and
               David Kanter and
               Naveen Kumar and
               Jeffery Liao and
               Deepak Narayanan and
               Tayo Oguntebi and
               Gennady Pekhimenko and
               Lillian Pentecost and
               Vijay Janapa Reddi and
               Taylor Robie and
               Tom St. John and
               Carole{-}Jean Wu and
               Lingjie Xu and
               Cliff Young and
               Matei Zaharia},
  editor    = {Inderjit S. Dhillon and
               Dimitris S. Papailiopoulos and
               Vivienne Sze},
  title     = {{MLPerf} Training Benchmark},
  booktitle = {Proceedings of Machine Learning and Systems 2020, MLSys 2020, Austin, TX, USA, March 2-4, 2020},
  publisher = {mlsys.org},
  year      = {2020},
  url       = {https://proceedings.mlsys.org/book/309.pdf},
  timestamp = {Thu, 18 Jun 2020 15:48:04 +0200},
  biburl    = {https://dblp.org/rec/conf/mlsys/MattsonCDCMPTWB20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
Towards Making the Most of BERT in Neural Machine Translation
BibTeX
Jiacheng Yang, Mingxuan Wang, Hao Zhou, Chengqi Zhao, Weinan Zhang, Yong Yu, Lei Li
AAAI, February 2020
Jiacheng Yang, Mingxuan Wang, Hao Zhou, Chengqi Zhao, Weinan Zhang, Yong Yu, Lei Li
AAAI, February 2020
% Conference paper (AAAI 2020), as exported from dblp.
@inproceedings{UofTEcoSystem_BERT_for_NMT,
  title     = {Towards Making the Most of {BERT} in Neural Machine Translation},
  author    = {Jiacheng Yang and
               Mingxuan Wang and
               Hao Zhou and
               Chengqi Zhao and
               Weinan Zhang and
               Yong Yu and
               Lei Li},
  booktitle = {The Thirty-Fourth {AAAI} Conference on Artificial Intelligence, {AAAI} 2020, The Thirty-Second Innovative Applications of Artificial Intelligence Conference, {IAAI} 2020, The Tenth {AAAI} Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2020, New York, NY, USA, February 7-12, 2020},
  publisher = {{AAAI} Press},
  year      = {2020},
  pages     = {9378--9385},
  url       = {https://aaai.org/ojs/index.php/AAAI/article/view/6479},
  biburl    = {https://dblp.org/rec/conf/aaai/YangW0Z00020.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  timestamp = {Tue, 02 Feb 2021 08:00:21 +0100}
}
Janus: Optimizing Memory and Storage Support for Non-Volatile Memory Systems
BibTeX
Sihang Liu, Korakit Seemakhupt, Gennady Pekhimenko, Aasheesh Kolli, and Samira Khan
ISCA, June 2019
MICRO Top Picks Honorable Mention
Sihang Liu, Korakit Seemakhupt, Gennady Pekhimenko, Aasheesh Kolli, and Samira Khan
ISCA, June 2019
MICRO Top Picks Honorable Mention
% Conference paper (ISCA 2019), as exported from dblp.
@inproceedings{UofTEcoSystem_Janus,
  title     = {{Janus}: optimizing memory and storage support for non-volatile memory systems},
  author    = {Sihang Liu and
               Korakit Seemakhupt and
               Gennady Pekhimenko and
               Aasheesh Kolli and
               Samira Manabi Khan},
  booktitle = {Proceedings of the 46th International Symposium on Computer Architecture, {ISCA} 2019, Phoenix, AZ, USA, June 22-26, 2019},
  editor    = {Srilatha Bobbie Manne and
               Hillery C. Hunter and
               Erik R. Altman},
  publisher = {{ACM}},
  year      = {2019},
  pages     = {143--156},
  doi       = {10.1145/3307650.3322206},
  url       = {https://doi.org/10.1145/3307650.3322206},
  biburl    = {https://dblp.org/rec/conf/isca/0001SPKK19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  timestamp = {Tue, 29 Dec 2020 09:53:49 +0100}
}
Priority-based Parameter Propagation for Distributed DNN Training
BibTeX
Anand Jayarajan, Jinliang Wei, Garth Gibson, Alexandra Fedorova, Gennady Pekhimenko
SysML, April 2019
Anand Jayarajan, Jinliang Wei, Garth Gibson, Alexandra Fedorova, Gennady Pekhimenko
SysML, April 2019
% Conference paper (MLSys 2019), as exported from dblp.
@inproceedings{UofTEcoSystem_P3,
  title     = {Priority-based Parameter Propagation for Distributed {DNN} Training},
  author    = {Anand Jayarajan and
               Jinliang Wei and
               Garth Gibson and
               Alexandra Fedorova and
               Gennady Pekhimenko},
  booktitle = {Proceedings of Machine Learning and Systems 2019, MLSys 2019, Stanford, CA, USA, March 31 - April 2, 2019},
  editor    = {Ameet Talwalkar and
               Virginia Smith and
               Matei Zaharia},
  publisher = {mlsys.org},
  year      = {2019},
  url       = {https://proceedings.mlsys.org/book/283.pdf},
  biburl    = {https://dblp.org/rec/conf/mlsys/JayarajanWGFP19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  timestamp = {Thu, 18 Jun 2020 15:48:01 +0200}
}
StreamBox-HBM: Stream Analytics on High Bandwidth Hybrid Memory
BibTeX
Hongyu Miao, Myeongjae Jeon, Gennady Pekhimenko, Kathryn S. McKinley, Felix Xiaozhu Lin
ASPLOS, April 2019
Hongyu Miao, Myeongjae Jeon, Gennady Pekhimenko, Kathryn S. McKinley, Felix Xiaozhu Lin
ASPLOS, April 2019
% Conference paper (ASPLOS 2019), as exported from dblp.
@inproceedings{UofTEcoSystem_StreamBox,
  title     = {{StreamBox-HBM}: Stream Analytics on High Bandwidth Hybrid Memory},
  author    = {Hongyu Miao and
               Myeongjae Jeon and
               Gennady Pekhimenko and
               Kathryn S. McKinley and
               Felix Xiaozhu Lin},
  booktitle = {Proceedings of the Twenty-Fourth International Conference on Architectural Support for Programming Languages and Operating Systems, {ASPLOS} 2019, Providence, RI, USA, April 13-17, 2019},
  editor    = {Iris Bahar and
               Maurice Herlihy and
               Emmett Witchel and
               Alvin R. Lebeck},
  publisher = {{ACM}},
  year      = {2019},
  pages     = {167--181},
  doi       = {10.1145/3297858.3304031},
  url       = {https://doi.org/10.1145/3297858.3304031},
  biburl    = {https://dblp.org/rec/conf/asplos/MiaoJPML19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  timestamp = {Tue, 09 Feb 2021 13:47:47 +0100}
}
EcoRNN: Efficient Computing of LSTM RNN on GPUs
BibTeX
Bojian Zheng, Gennady Pekhimenko
MICRO ACM Student Research Competition, October 2018
Third Place in ACM Student Research Competition
Bojian Zheng, Gennady Pekhimenko
MICRO ACM Student Research Competition, October 2018
Third Place in ACM Student Research Competition
% Poster hosted online (the URL points to a MICRO-51 SRC poster PDF).
% The acronyms in the title are brace-protected so that styles applying
% sentence casing keep their capitalization.
% NOTE(review): the online entry type is a biblatex type; classic BibTeX
% styles may not recognize it -- confirm the target toolchain.
@online{UofTEcoSystem_EcoRNN,
  author = {Bojian Zheng and
            Gennady Pekhimenko},
  title  = {{EcoRNN}: Efficient Computing of {LSTM} {RNN} on {GPUs}},
  year   = {2018},
  url    = {https://www.microarch.org/micro51/SRC/posters/20_zheng.pdf}
}
Benchmarking and Analyzing Deep Neural Network Training
BibTeX
Hongyu Zhu, Mohamed Akrout, Bojian Zheng, Andrew Pelegris, Amar Phanishayee, Bianca Schroeder, Gennady Pekhimenko
IISWC, July 2018
Hongyu Zhu, Mohamed Akrout, Bojian Zheng, Andrew Pelegris, Amar Phanishayee, Bianca Schroeder, Gennady Pekhimenko
IISWC, July 2018
% Conference paper (IISWC 2018), as exported from dblp.
% NOTE(review): this record lists Anand Jayarajan, who does not appear in the
% listing's author line -- confirm against the paper.
@inproceedings{UofTEcoSystem_TBD_IISWC,
  title     = {Benchmarking and Analyzing Deep Neural Network Training},
  author    = {Hongyu Zhu and
               Mohamed Akrout and
               Bojian Zheng and
               Andrew Pelegris and
               Anand Jayarajan and
               Amar Phanishayee and
               Bianca Schroeder and
               Gennady Pekhimenko},
  booktitle = {2018 {IEEE} International Symposium on Workload Characterization, {IISWC} 2018, Raleigh, NC, USA, September 30 - October 2, 2018},
  publisher = {{IEEE} Computer Society},
  year      = {2018},
  pages     = {88--100},
  doi       = {10.1109/IISWC.2018.8573476},
  url       = {https://doi.org/10.1109/IISWC.2018.8573476},
  biburl    = {https://dblp.org/rec/conf/iiswc/ZhuAZPJPSP18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  timestamp = {Wed, 16 Oct 2019 14:14:56 +0200}
}
TerseCades: Efficient Data Compression in Stream Processing
BibTeX
Gennady Pekhimenko, Chuanxiong Guo, Myeongjae Jeon, Ryan Huang, and Lidong Zhou
USENIX Annual Technical Conference, July 2018
Gennady Pekhimenko, Chuanxiong Guo, Myeongjae Jeon, Ryan Huang, and Lidong Zhou
USENIX Annual Technical Conference, July 2018
% USENIX ATC 2018 conference paper; record sourced from dblp (see biburl).
@inproceedings{UofTEcoSystem_TerseCades,
  author    = {Pekhimenko, Gennady and
               Guo, Chuanxiong and
               Jeon, Myeongjae and
               Huang, Peng and
               Zhou, Lidong},
  editor    = {Gunawi, Haryadi S. and
               Reed, Benjamin},
  title     = {{TerseCades}: Efficient Data Compression in Stream Processing},
  booktitle = {2018 {USENIX} Annual Technical Conference, {USENIX} {ATC} 2018, Boston,
               MA, USA, July 11-13, 2018},
  pages     = {307--320},
  publisher = {{USENIX} Association},
  year      = {2018},
  url       = {https://www.usenix.org/conference/atc18/presentation/pekhimenko},
  timestamp = {Mon, 01 Feb 2021 08:43:54 +0100},
  biburl    = {https://dblp.org/rec/conf/usenix/PekhimenkoGJHZ18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
Gist: Efficient Data Encoding for Deep Neural Network Training
BibTeX
Animesh Jain, Amar Phanishayee, Jason Mars, Lingjia Tang, Gennady Pekhimenko
ISCA, June 2018
Animesh Jain, Amar Phanishayee, Jason Mars, Lingjia Tang, Gennady Pekhimenko
ISCA, June 2018
% ISCA 2018 conference paper; record sourced from dblp (see biburl).
@inproceedings{UofTEcoSystem_Gist,
  author    = {Jain, Animesh and
               Phanishayee, Amar and
               Mars, Jason and
               Tang, Lingjia and
               Pekhimenko, Gennady},
  editor    = {Annavaram, Murali and
               Pinkston, Timothy Mark and
               Falsafi, Babak},
  title     = {{Gist}: Efficient Data Encoding for Deep Neural Network Training},
  booktitle = {45th {ACM/IEEE} Annual International Symposium on Computer Architecture,
               {ISCA} 2018, Los Angeles, CA, USA, June 1-6, 2018},
  pages     = {776--789},
  publisher = {{IEEE} Computer Society},
  year      = {2018},
  url       = {https://doi.org/10.1109/ISCA.2018.00070},
  doi       = {10.1109/ISCA.2018.00070},
  timestamp = {Sun, 10 May 2020 21:12:50 +0200},
  biburl    = {https://dblp.org/rec/conf/isca/JainPMTP18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
A Case for Richer Cross-Layer Abstractions: Bridging the Semantic Gap with Expressive Memory
BibTeX
Nandita Vijaykumar, Abhilasha Jain, Diptesh Majumdar, Kevin Hsieh, Gennady Pekhimenko, Eiman Ebrahimi, Nastaran Hajinazar, Phillip B. Gibbons, Onur Mutlu
ISCA, June 2018
Nandita Vijaykumar, Abhilasha Jain, Diptesh Majumdar, Kevin Hsieh, Gennady Pekhimenko, Eiman Ebrahimi, Nastaran Hajinazar, Phillip B. Gibbons, Onur Mutlu
ISCA, June 2018
% ISCA 2018 conference paper; record sourced from dblp (see biburl).
@inproceedings{UofTEcoSystem_XMem,
  author    = {Vijaykumar, Nandita and
               Jain, Abhilasha and
               Majumdar, Diptesh and
               Hsieh, Kevin and
               Pekhimenko, Gennady and
               Ebrahimi, Eiman and
               Hajinazar, Nastaran and
               Gibbons, Phillip B. and
               Mutlu, Onur},
  editor    = {Annavaram, Murali and
               Pinkston, Timothy Mark and
               Falsafi, Babak},
  title     = {A Case for Richer Cross-Layer Abstractions: Bridging the Semantic
               Gap with Expressive Memory},
  booktitle = {45th {ACM/IEEE} Annual International Symposium on Computer Architecture,
               {ISCA} 2018, Los Angeles, CA, USA, June 1-6, 2018},
  pages     = {207--220},
  publisher = {{IEEE} Computer Society},
  year      = {2018},
  url       = {https://doi.org/10.1109/ISCA.2018.00027},
  doi       = {10.1109/ISCA.2018.00027},
  timestamp = {Sun, 10 May 2020 21:12:50 +0200},
  biburl    = {https://dblp.org/rec/conf/isca/VijaykumarJMHPE18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
TBD: Benchmarking and Analyzing Deep Neural Network Training
BibTeX
Hongyu Zhu, Mohamed Akrout, Bojian Zheng, Andrew Pelegris, Amar Phanishayee, Bianca Schroeder, Gennady Pekhimenko
arXiv, March 2018
Hongyu Zhu, Mohamed Akrout, Bojian Zheng, Andrew Pelegris, Amar Phanishayee, Bianca Schroeder, Gennady Pekhimenko
arXiv, March 2018
% arXiv preprint (CoRR abs/1803.06905); record sourced from dblp (see biburl).
% The eprint archive is given via eprinttype and an https arXiv URL, matching
% the other arXiv entry in this file.
@article{UofTEcoSystem_TBD_arXiv,
  author     = {Zhu, Hongyu and
                Akrout, Mohamed and
                Zheng, Bojian and
                Pelegris, Andrew and
                Phanishayee, Amar and
                Schroeder, Bianca and
                Pekhimenko, Gennady},
  title      = {{TBD}: Benchmarking and Analyzing Deep Neural Network Training},
  journal    = {CoRR},
  volume     = {abs/1803.06905},
  year       = {2018},
  url        = {https://arxiv.org/abs/1803.06905},
  eprinttype = {arXiv},
  eprint     = {1803.06905},
  timestamp  = {Mon, 13 Aug 2018 16:46:27 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1803-06905.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
DNN-Train: Benchmarking and Analyzing DNN Training
BibTeX
Hongyu Zhu, Bojian Zheng, Amar Phanishayee, Bianca Schroeder, Gennady Pekhimenko
SysML Conference, February 2018
Hongyu Zhu, Bojian Zheng, Amar Phanishayee, Bianca Schroeder, Gennady Pekhimenko
SysML Conference, February 2018
% DNN-Train paper hosted on mlsys.org (2018).
% Both occurrences of the acronym in the title are braced so sentence-casing
% styles keep their capitals.
@online{UofTEcoSystem_TBD_MLSys,
  author = {Zhu, Hongyu and
            Zheng, Bojian and
            Phanishayee, Amar and
            Schroeder, Bianca and
            Pekhimenko, Gennady},
  title  = {{DNN-Train}: Benchmarking and Analyzing {DNN} Training},
  year   = {2018},
  url    = {https://mlsys.org/Conferences/doc/2018/167.pdf}
}
StreamBox: Modern Stream Processing on a Multicore Machine
BibTeX
Hongyu Miao, Heejin Park, Myeongjae Jeon, Gennady Pekhimenko, Kathryn S. McKinley, Felix Xiaozhu Lin
USENIX Annual Technical Conference, July 2017
Hongyu Miao, Heejin Park, Myeongjae Jeon, Gennady Pekhimenko, Kathryn S. McKinley, Felix Xiaozhu Lin
USENIX Annual Technical Conference, July 2017
% USENIX ATC 2017 conference paper; record sourced from dblp (see biburl).
% Names use the comma form; this keeps the two-word editor surname Da Silva
% together, which the First-Last form would split into first name and surname.
@inproceedings{UofTEcoSystem_Streambox,
  author    = {Miao, Hongyu and
               Park, Heejin and
               Jeon, Myeongjae and
               Pekhimenko, Gennady and
               McKinley, Kathryn S. and
               Lin, Felix Xiaozhu},
  editor    = {Da Silva, Dilma and
               Ford, Bryan},
  title     = {{StreamBox}: Modern Stream Processing on a Multicore Machine},
  booktitle = {2017 {USENIX} Annual Technical Conference, {USENIX} {ATC} 2017, Santa
               Clara, CA, USA, July 12-14, 2017},
  pages     = {617--629},
  publisher = {{USENIX} Association},
  year      = {2017},
  url       = {https://www.usenix.org/conference/atc17/technical-sessions/presentation/miao},
  timestamp = {Tue, 09 Feb 2021 13:47:51 +0100},
  biburl    = {https://dblp.org/rec/conf/usenix/MiaoPJPML17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
Design-Induced Latency Variation in Modern DRAM Chips: Characterization, Analysis, and Latency Reduction Mechanisms
BibTeX
Donghyuk Lee, Samira Khan, Lavanya Subramanian, Saugata Ghose, Rachata Ausavarungnirun, Gennady Pekhimenko, Vivek Seshadri, Onur Mutlu
SIGMETRICS, June 2017
Donghyuk Lee, Samira Khan, Lavanya Subramanian, Saugata Ghose, Rachata Ausavarungnirun, Gennady Pekhimenko, Vivek Seshadri, Onur Mutlu
SIGMETRICS, June 2017
% Journal article, volume 1 number 1 (2017); record sourced from dblp (see biburl).
% The acronym in the journal name is braced, as venue acronyms are in the
% neighbouring entries.
@article{UofTEcoSystem_DIVA,
  author    = {Lee, Donghyuk and
               Khan, Samira Manabi and
               Subramanian, Lavanya and
               Ghose, Saugata and
               Ausavarungnirun, Rachata and
               Pekhimenko, Gennady and
               Seshadri, Vivek and
               Mutlu, Onur},
  title     = {Design-Induced Latency Variation in Modern {DRAM} Chips: Characterization,
               Analysis, and Latency Reduction Mechanisms},
  journal   = {Proceedings of the {ACM} on Measurement and Analysis of Computing Systems},
  volume    = {1},
  number    = {1},
  pages     = {26:1--26:36},
  year      = {2017},
  url       = {https://doi.org/10.1145/3084464},
  doi       = {10.1145/3084464},
  timestamp = {Thu, 09 Jul 2020 22:58:52 +0200},
  biburl    = {https://dblp.org/rec/journals/pomacs/LeeKSGAPSM17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
SoftMC: A Flexible and Practical Open-Source Infrastructure for Enabling Experimental DRAM Studies
BibTeX
Hasan Hassan, Nandita Vijaykumar, Samira Khan, Saugata Ghose, Kevin Chang, Gennady Pekhimenko, Donghyuk Lee, Oguz Ergin, Onur Mutlu
HPCA-23, February 2017
Hasan Hassan, Nandita Vijaykumar, Samira Khan, Saugata Ghose, Kevin Chang, Gennady Pekhimenko, Donghyuk Lee, Oguz Ergin, Onur Mutlu
HPCA-23, February 2017
% SoftMC arXiv record (CoRR abs/1805.03195, 2018); sourced from dblp (see biburl).
% NOTE(review): the listing above this entry names the HPCA-23 (February 2017)
% paper, whose title differs from this record's; confirm which one is intended.
@article{UofTEcoSystem_SoftMC,
  author     = {Hassan, Hasan and
                Vijaykumar, Nandita and
                Khan, Samira Manabi and
                Ghose, Saugata and
                Chang, Kevin K. and
                Pekhimenko, Gennady and
                Lee, Donghyuk and
                Ergin, Oguz and
                Mutlu, Onur},
  title      = {{SoftMC}: Practical {DRAM} Characterization Using an {FPGA}-Based Infrastructure},
  journal    = {CoRR},
  volume     = {abs/1805.03195},
  year       = {2018},
  url        = {https://arxiv.org/abs/1805.03195},
  eprinttype = {arXiv},
  eprint     = {1805.03195},
  timestamp  = {Mon, 13 Aug 2018 16:46:07 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1805-03195.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}