BibTeX Export of Organization::TUDarmstadt::Topic::DNN
@comment{Entries are listed in reverse chronological order (newest first).}

@INPROCEEDINGS{butler_ea_2024_SC,
  author    = {Butler, Branden and Yu, Sixing and Mazaheri, Arya and Jannesari, Ali},
  month     = nov,
  title     = {{PipeInfer}: Accelerating {LLM} Inference using Asynchronous Pipelined Speculation},
  booktitle = {Proc. of the International Conference for High Performance Computing, Networking, Storage, and Analysis (SC), Atlanta, GA, USA},
  year      = {2024},
  pages     = {1--13},
  note      = {(accepted)}
}

@INPROCEEDINGS{beringer_ea_ICPP_2024,
  author    = {Beringer, Tim and Stock, Jakob and Mazaheri, Arya and Wolf, Felix},
  month     = aug,
  title     = {Dissecting Convolutional Neural Networks for Runtime and Scalability Prediction},
  booktitle = {Proc. of the 53rd International Conference on Parallel Processing (ICPP), Gotland, Sweden},
  year      = {2024},
  pages     = {168--178},
  publisher = {ACM},
  isbn      = {979-8-4007-1793-2},
  doi       = {10.1145/3673038.3673107}
}

@INPROCEEDINGS{yu_ea:2022:icml,
  author    = {Yu, Sixing and Mazaheri, Arya and Jannesari, Ali},
  keywords  = {deep learning, network pruning, reinforcement learning},
  month     = jul,
  title     = {Topology-Aware Network Pruning using Multi-stage Graph Embedding and Reinforcement Learning},
  booktitle = {Proc. of the 39th International Conference on Machine Learning (ICML), Baltimore, Maryland, USA},
  series    = {Proceedings of Machine Learning Research},
  volume    = {162},
  year      = {2022},
  pages     = {25656--25667},
  publisher = {PMLR}
}

@INPROCEEDINGS{mammadli_corl:SC:2020,
  author    = {Mammadli, Rahim and Jannesari, Ali and Wolf, Felix},
  month     = nov,
  title     = {Static Neural Compiler Optimization via Deep Reinforcement Learning},
  booktitle = {Proc. of the 6th Workshop on the LLVM Compiler Infrastructure in HPC, held in conjunction with the Supercomputing Conference (SC20)},
  year      = {2020},
  pages     = {1--11},
  publisher = {IEEE},
  doi       = {10.1109/LLVMHPCHiPar51896.2020.00006}
}

@INPROCEEDINGS{mazaheri_ea:2020:eurosys,
  author    = {Mazaheri, Arya and Beringer, Tim and Moskewicz, Matthew and Wolf, Felix and Jannesari, Ali},
  keywords  = {deep learning, meta-programming, symbolic computation, winograd convolution},
  month     = apr,
  title     = {Accelerating {Winograd} Convolutions using Symbolic Computation and Meta-programming},
  booktitle = {Proc. of the 15th EuroSys Conference, Heraklion, Crete, Greece},
  number    = {40},
  year      = {2020},
  pages     = {1--14},
  publisher = {ACM},
  isbn      = {978-1-4503-6882-7},
  doi       = {10.1145/3342195.3387549}
}

@INPROCEEDINGS{mazaheri_ea:euro-par:2019,
  author    = {Mazaheri, Arya and Schulte, Johannes and Moskewicz, Matthew and Wolf, Felix and Jannesari, Ali},
  month     = aug,
  title     = {Enhancing the Programmability and Performance Portability of {GPU} Tensor Operations},
  booktitle = {Proc. of the 25th Euro-Par Conference, G{\"{o}}ttingen, Germany},
  series    = {Lecture Notes in Computer Science},
  volume    = {11725},
  year      = {2019},
  pages     = {213--226},
  publisher = {Springer},
  note      = {(best paper award)},
  isbn      = {978-3-030-29399-4},
  doi       = {10.1007/978-3-030-29400-7_16}
}

@ARTICLE{mammadli_ea:taco:2019,
  author  = {Mammadli, Rahim and Wolf, Felix and Jannesari, Ali},
  month   = jan,
  title   = {The Art of Getting Deep Neural Networks in Shape},
  journal = {ACM Transactions on Architecture and Code Optimization (TACO)},
  volume  = {15},
  number  = {4},
  year    = {2019},
  pages   = {62:1--62:21},
  issn    = {1544-3566},
  doi     = {10.1145/3291053}
}