% Conference paper, SC '24. The non-standard fields bibtex_show/selected are
% ignored by standard BibTeX styles; presumably they are consumed by the
% publication-page generator (verify against the site configuration).
@inproceedings{Jain-SC24-PAL,
  author      = {Jain, Rutwik and Tran, Brandon and Chen, Keting and Sinclair, Matthew D. and Venkataraman, Shivaram},
  title       = {{PAL}: A Variability-Aware Policy for Scheduling {ML} Workloads in {GPU} Clusters},
  booktitle   = {Proceedings of the International Conference for High Performance Computing, Networking, Storage, and Analysis},
  series      = {SC '24},
  location    = {Atlanta, GA, USA},
  publisher   = {IEEE Press},
  year        = {2024},
  articleno   = {26},
  numpages    = {18},
  isbn        = {9798350352917},
  doi         = {10.1109/SC41406.2024.00032},
  url         = {https://doi.org/10.1109/SC41406.2024.00032},
  keywords    = {Cluster Scheduling, GPGPU, Machine Learning, Performance Variability, Power Management},
  bibtex_show = {true},
  selected    = {true},
}
2023
Fifty Years of the International Symposium on Computer Architecture: A Data-Driven Retrospective
Matthew D.
Sinclair, Parthasarathy
Ranganathan, Gaurang
Upasani, and
5 more authors
% Journal article, IEEE Micro 43(6). The non-standard field bibtex_show is
% ignored by standard BibTeX styles; presumably it is consumed by the
% publication-page generator (verify against the site configuration).
@article{Sinclair-Micro23-ISCA,
  author      = {Sinclair, Matthew D. and Ranganathan, Parthasarathy and Upasani, Gaurang and Sampson, Adrian and Patterson, David and Jain, Rutwik and Parthasarathy, Nidhi and Shah, Shaan},
  title       = {Fifty Years of the {International Symposium on Computer Architecture}: A Data-Driven Retrospective},
  journal     = {IEEE Micro},
  year        = {2023},
  volume      = {43},
  number      = {6},
  pages       = {109--124},
  doi         = {10.1109/MM.2023.3324465},
  bibtex_show = {true},
}
2022
Not All GPUs Are Created Equal: Characterizing Variability in Large-Scale, Accelerator-Rich Systems
Prasoon
Sinha, Akhil
Guliani, Rutwik
Jain, and
3 more authors
In SC22: International Conference for High Performance Computing, Networking, Storage and Analysis , Nov 2022
% Conference paper, SC22. The non-standard fields bibtex_show/selected are
% ignored by standard BibTeX styles; presumably they are consumed by the
% publication-page generator (verify against the site configuration).
@inproceedings{Sinha-SC22-GPUVar,
  author      = {Sinha, Prasoon and Guliani, Akhil and Jain, Rutwik and Tran, Brandon and Sinclair, Matthew D. and Venkataraman, Shivaram},
  title       = {Not All {GPUs} Are Created Equal: Characterizing Variability in Large-Scale, Accelerator-Rich Systems},
  booktitle   = {SC22: International Conference for High Performance Computing, Networking, Storage and Analysis},
  publisher   = {IEEE Computer Society},
  address     = {Los Alamitos, CA, USA},
  year        = {2022},
  month       = nov,
  pages       = {1--15},
  doi         = {10.1109/SC41404.2022.00070},
  url         = {https://doi.ieeecomputersociety.org/10.1109/SC41404.2022.00070},
  bibtex_show = {true},
  selected    = {true},
}