BibTeX Export of Author::Mazaheri
@comment{
  Publications co-authored by Arya Mazaheri, newest first.
  Conventions used below: one field per line; month given as an unquoted
  three-letter macro; page ranges with a double hyphen; DOIs stored bare
  (no resolver prefix); braces inside titles protect acronyms and proper
  names from style-driven recasing; conference location is kept inside
  booktitle.
}

@inproceedings{butler_ea_2024_SC,
  author    = {Butler, Branden and Yu, Sixing and Mazaheri, Arya and Jannesari, Ali},
  month     = nov,
  title     = {{PipeInfer}: Accelerating {LLM} Inference using Asynchronous Pipelined Speculation},
  booktitle = {Proc. of the International Conference for High Performance Computing, Networking, Storage, and Analysis (SC), Atlanta, GA, USA},
  year      = {2024},
  pages     = {1--13},
  note      = {(accepted)}
}

@inproceedings{beringer_ea_ICPP_2024,
  author    = {Beringer, Tim and Stock, Jakob and Mazaheri, Arya and Wolf, Felix},
  month     = aug,
  title     = {Dissecting Convolutional Neural Networks for Runtime and Scalability Prediction},
  booktitle = {Proc. of the 53rd International Conference on Parallel Processing (ICPP), Gotland, Sweden},
  year      = {2024},
  pages     = {168--178},
  publisher = {ACM},
  isbn      = {979-8-4007-1793-2},
  doi       = {10.1145/3673038.3673107}
}

@inproceedings{oezden_ea:2022:icpp,
  author    = {{\"{O}}zden, Taylan and Beringer, Tim and Mazaheri, Arya and Fard, Hamid Mohammadi and Wolf, Felix},
  keywords  = {adaptive job scheduling, batch systems, malleable workloads, resource management, simulations},
  month     = aug,
  title     = {{ElastiSim}: A Batch-System Simulator for Malleable Workloads},
  booktitle = {Proc. of the 51st International Conference on Parallel Processing (ICPP), Bordeaux, France},
  year      = {2022},
  pages     = {1--11},
  publisher = {ACM},
  isbn      = {978-1-4503-9733-9},
  doi       = {10.1145/3545008.3545046}
}

@inproceedings{yu_ea:2022:icml,
  author    = {Yu, Sixing and Mazaheri, Arya and Jannesari, Ali},
  keywords  = {deep learning, network pruning, reinforcement learning},
  month     = jul,
  title     = {Topology-Aware Network Pruning using Multi-stage Graph Embedding and Reinforcement Learning},
  booktitle = {Proc. of the 39th International Conference on Machine Learning (ICML), Baltimore, Maryland, USA},
  series    = {Proceedings of Machine Learning Research},
  volume    = {162},
  year      = {2022},
  pages     = {25656--25667},
  publisher = {PMLR}
}

@phdthesis{mazaheri:diss:2022,
  author  = {Mazaheri, Arya},
  month   = apr,
  title   = {Performance engineering of data-intensive applications},
  type    = {Dissertation},
  year    = {2022},
  school  = {Technische Universit{\"{a}}t Darmstadt},
  address = {Darmstadt, Germany},
  doi     = {10.26083/tuprints-00021078}
}

@inproceedings{yu_ea:2021:iccv,
  author    = {Yu, Sixing and Mazaheri, Arya and Jannesari, Ali},
  keywords  = {deep learning, network pruning, reinforcement learning},
  month     = oct,
  title     = {Auto Graph Encoder-Decoder for Neural Network Pruning},
  booktitle = {Proc. of the IEEE/CVF International Conference on Computer Vision (ICCV), Montreal, Canada},
  year      = {2021},
  pages     = {6362--6372},
  publisher = {IEEE/CVF}
}

@inproceedings{haehnle_ea:2020:isola,
  author    = {H{\"{a}}hnle, Reiner and Heydari Tabar, Asmae and Mazaheri, Arya and Norouzi, Mohammad and Steinh{\"{o}}fel, Dominic and Wolf, Felix},
  editor    = {Margaria, Tiziana and Steffen, Bernhard},
  title     = {Safer Parallelization},
  booktitle = {Proc. of the 9th International Symposium On Leveraging Applications of Formal Methods, Verification and Validation: Engineering Principles. ISoLA 2020, Rhodes, Greece},
  series    = {Lecture Notes in Computer Science},
  volume    = {12477},
  year      = {2020},
  pages     = {117--137},
  publisher = {Springer},
  isbn      = {978-3-030-61470-6},
  doi       = {10.1007/978-3-030-61470-6_8}
}

@inproceedings{schrammel_ea:euro-par:2020,
  author    = {Schrammel, Fabian and Renk, Florian and Mazaheri, Arya and Wolf, Felix},
  month     = aug,
  title     = {Efficient Ephemeris Models for Spacecraft Trajectory Simulations on {GPU}s},
  booktitle = {Proc. of the 26th Euro-Par Conference, Warsaw, Poland},
  series    = {Lecture Notes in Computer Science},
  volume    = {12247},
  year      = {2020},
  pages     = {561--577},
  publisher = {Springer},
  isbn      = {978-3-030-57674-5},
  doi       = {10.1007/978-3-030-57675-2_35}
}

@inproceedings{mazaheri_ea:2020:eurosys,
  author    = {Mazaheri, Arya and Beringer, Tim and Moskewicz, Matthew and Wolf, Felix and Jannesari, Ali},
  keywords  = {deep learning, meta-programming, symbolic computation, winograd convolution},
  month     = apr,
  title     = {Accelerating {Winograd} Convolutions using Symbolic Computation and Meta-programming},
  booktitle = {Proc. of the 15th EuroSys Conference, Heraklion, Crete, Greece},
  number    = {40},
  year      = {2020},
  pages     = {1--14},
  publisher = {ACM},
  isbn      = {978-1-4503-6882-7},
  doi       = {10.1145/3342195.3387549}
}

@inproceedings{mazaheri_ea:euro-par:2019,
  author    = {Mazaheri, Arya and Schulte, Johannes and Moskewicz, Matthew and Wolf, Felix and Jannesari, Ali},
  month     = aug,
  title     = {Enhancing the Programmability and Performance Portability of {GPU} Tensor Operations},
  booktitle = {Proc. of the 25th Euro-Par Conference, G{\"{o}}ttingen, Germany},
  series    = {Lecture Notes in Computer Science},
  volume    = {11725},
  year      = {2019},
  pages     = {213--226},
  publisher = {Springer},
  note      = {(best paper award)},
  isbn      = {978-3-030-29399-4},
  doi       = {10.1007/978-3-030-29400-7_16}
}

@inproceedings{mazaheri2018unveiling,
  author    = {Mazaheri, Arya and Wolf, Felix and Jannesari, Ali},
  month     = aug,
  title     = {Unveiling Thread Communication Bottlenecks Using Hardware-Independent Metrics},
  booktitle = {Proc. of the 47th International Conference on Parallel Processing (ICPP), Eugene, OR, USA},
  year      = {2018},
  pages     = {6:1--6:10},
  publisher = {ACM},
  isbn      = {978-1-4503-6510-9},
  doi       = {10.1145/3225058.3225142}
}

@inproceedings{Mazaheri_et_al:2015:Comm_pattern_ICPP,
  author    = {Mazaheri, Arya and Jannesari, Ali and Mirzaei, Abdolreza and Wolf, Felix},
  month     = sep,
  title     = {Characterizing Loop-Level Communication Patterns in Shared Memory Applications},
  booktitle = {Proc. of the 44th International Conference on Parallel Processing (ICPP), Beijing, China},
  year      = {2015},
  pages     = {759--768},
  issn      = {0190-3918},
  doi       = {10.1109/ICPP.2015.85}
}