mirror of
https://github.com/harvard-edge/cs249r_book.git
synced 2026-03-11 17:49:25 -05:00
Simplify title and fix bibliography entry types
- Remove "Tensors to Systems" from subtitle for cleaner title
- Fix @article entries that should be @inproceedings (kannan2022astrasim, micikevicius2018mixed, strubell2019energy, vaswani2017attention)
- Remove duplicate booktitle field from williams2009roofline
- Standardize year fields across entries
This commit is contained in:
@@ -218,7 +218,7 @@
|
||||
% Title and authors - improved typography
|
||||
\title{
|
||||
\Huge\bfseries Tiny\emoji{fire}Torch\\[0.4em]
|
||||
\Large\normalfont\itshape Building Machine Learning Systems from First Principles: Tensors to Systems
|
||||
\Large\normalfont\itshape Building Machine Learning Systems from First Principles
|
||||
}
|
||||
\author{
|
||||
\fontsize{12}{15}\selectfont
|
||||
|
||||
@@ -233,24 +233,13 @@
|
||||
note = {RISC-V edition, used in MIT 6.S081},
|
||||
}
|
||||
|
||||
@article{kannan2022astrasim,
|
||||
title = {
|
||||
ASTRA-sim2.0: Modeling Hierarchical Networks and Disaggregated Systems for Large-model Training
|
||||
at Scale
|
||||
},
|
||||
author = {
|
||||
Won, William and Heo, Taekyung and Rashidi, Saeed and Sridharan, Srinivas and Srinivasan,
|
||||
Sudarshan and Krishna, Tushar
|
||||
},
|
||||
booktitle = {
|
||||
Proceedings of the 2023 IEEE International Symposium on Performance Analysis of Systems and
|
||||
Software (ISPASS)
|
||||
},
|
||||
@inproceedings{kannan2022astrasim,
|
||||
title = {ASTRA-sim2.0: Modeling Hierarchical Networks and Disaggregated Systems for Large-model Training at Scale},
|
||||
author = {Won, William and Heo, Taekyung and Rashidi, Saeed and Sridharan, Srinivas and Srinivasan, Sudarshan and Krishna, Tushar},
|
||||
booktitle = {Proceedings of the 2023 IEEE International Symposium on Performance Analysis of Systems and Software (ISPASS)},
|
||||
year = {2023},
|
||||
doi = {10.1109/ISPASS57527.2023.00035},
|
||||
url = {http://arxiv.org/abs/2303.14006v1},
|
||||
date = {2023-03-24},
|
||||
primaryclass = {cs.DC},
|
||||
archiveprefix = {arXiv},
|
||||
}
|
||||
|
||||
@article{kapur2008productive,
|
||||
@@ -381,18 +370,12 @@
|
||||
editor = {Rust, C.},
|
||||
}
|
||||
|
||||
@article{micikevicius2018mixed,
|
||||
@inproceedings{micikevicius2018mixed,
|
||||
title = {Mixed Precision Training},
|
||||
author = {
|
||||
Micikevicius, Paulius and Narang, Sharan and Alben, Jonah and Diamos, Gregory and Elsen, Erich
|
||||
and Garcia, David and Ginsburg, Boris and Houston, Michael and Kuchaiev, Oleksii and Venkatesh,
|
||||
Ganesh and Wu, Hao
|
||||
},
|
||||
author = {Micikevicius, Paulius and Narang, Sharan and Alben, Jonah and Diamos, Gregory and Elsen, Erich and Garcia, David and Ginsburg, Boris and Houston, Michael and Kuchaiev, Oleksii and Venkatesh, Ganesh and Wu, Hao},
|
||||
booktitle = {International Conference on Learning Representations},
|
||||
year = {2018},
|
||||
url = {http://arxiv.org/abs/1710.03740v3},
|
||||
date = {2017-10-10},
|
||||
primaryclass = {cs.AI},
|
||||
archiveprefix = {arXiv},
|
||||
}
|
||||
|
||||
@book{mlsysbook2025,
|
||||
@@ -594,17 +577,15 @@
|
||||
url = {https://minitorch.github.io/},
|
||||
}
|
||||
|
||||
@article{strubell2019energy,
|
||||
@inproceedings{strubell2019energy,
|
||||
title = {Energy and Policy Considerations for Deep Learning in NLP},
|
||||
author = {Strubell, Emma and Ganesh, Ananya and McCallum, Andrew},
|
||||
booktitle = {Proceedings of the 57th Annual Meeting of the Association for Computational Linguistics},
|
||||
year = {2019},
|
||||
publisher = {Association for Computational Linguistics},
|
||||
address = {Florence, Italy},
|
||||
pages = {3645--3650},
|
||||
url = {http://arxiv.org/abs/1906.02243v1},
|
||||
date = {2019-06-05},
|
||||
primaryclass = {cs.CL},
|
||||
archiveprefix = {arXiv},
|
||||
}
|
||||
|
||||
@misc{sutton2019bitter,
|
||||
@@ -658,19 +639,14 @@
|
||||
pages = {155--161},
|
||||
}
|
||||
|
||||
@article{vaswani2017attention,
|
||||
@inproceedings{vaswani2017attention,
|
||||
title = {Attention Is All You Need},
|
||||
author = {
|
||||
Vaswani, Ashish and Shazeer, Noam and Parmar, Niki and Uszkoreit, Jakob and Jones, Llion and
|
||||
Gomez, Aidan N. and Kaiser, Lukasz and Polosukhin, Illia
|
||||
},
|
||||
author = {Vaswani, Ashish and Shazeer, Noam and Parmar, Niki and Uszkoreit, Jakob and Jones, Llion and Gomez, Aidan N. and Kaiser, Lukasz and Polosukhin, Illia},
|
||||
booktitle = {Advances in Neural Information Processing Systems},
|
||||
year = {2017},
|
||||
volume = {30},
|
||||
pages = {5998--6008},
|
||||
url = {http://arxiv.org/abs/1706.03762v7},
|
||||
date = {2017-06-12},
|
||||
primaryclass = {cs.CL},
|
||||
archiveprefix = {arXiv},
|
||||
}
|
||||
|
||||
@book{vygotsky1978mind,
|
||||
@@ -685,20 +661,15 @@
|
||||
}
|
||||
|
||||
@article{williams2009roofline,
|
||||
title = {Roofline},
|
||||
title = {Roofline: An Insightful Visual Performance Model for Multicore Architectures},
|
||||
author = {Williams, Samuel and Waterman, Andrew and Patterson, David},
|
||||
journal = {Communications of the ACM},
|
||||
booktitle = {Communications of the ACM},
|
||||
publisher = {Association for Computing Machinery (ACM)},
|
||||
year = {2009},
|
||||
volume = {52},
|
||||
number = {4},
|
||||
pages = {65--76},
|
||||
doi = {10.1145/1498765.1498785},
|
||||
issn = {0001-0782,1557-7317},
|
||||
url = {https://doi.org/10.1145/1498765.1498785},
|
||||
source = {Crossref},
|
||||
subtitle = {an insightful visual performance model for multicore architectures},
|
||||
date = {2009-04},
|
||||
publisher = {Association for Computing Machinery (ACM)},
|
||||
}
|
||||
|
||||
@article{zhang2021dive,
|
||||
|
||||
Reference in New Issue
Block a user