BibTeX Export
% Conference paper "PipeInfer" (SC 2024). The system name and the acronym in
% the title are brace-protected so sentence-casing styles keep their capitals.
% NOTE(review): the note field still says "(accepted)" -- confirm whether it
% should be dropped or replaced with a DOI now that the year and pages are set.
@inproceedings{butler_ea_2024_SC,
  author    = {Butler, Branden and Yu, Sixing and Mazaheri, Arya and Jannesari, Ali},
  title     = {{PipeInfer}: Accelerating {LLM} Inference using Asynchronous Pipelined Speculation},
  booktitle = {Proc. of the International Conference for High Performance Computing, Networking, Storage, and Analysis (SC), Atlanta, GA, USA},
  year      = {2024},
  month     = nov,
  pages     = {1--13},
  note      = {(accepted)},
}
Copy