% Conference paper from the International Joint Conference on Neural Networks (2025, IEEE).
% Acronyms in the title are wrapped in braces so that bibliography styles which
% sentence-case titles keep their capitalisation.
@inproceedings{inproceedings13b0a9ce,
  author    = {Mugnaini, Leandro Giusti and
               Yamamoto, Bruno Lopes and
               Alcantara, Lucas Lauton de and
               Zacarias, Victor and
               Bollis, Edson and
               Pellicer, Lucas Francisco Amaral Orosco and
               Reali Costa, Anna Helena and
               Correia, Artur Jordão Lima},
  title     = {Efficient {LLMs} with {AMP}: attention heads and {MLP} pruning},
  booktitle = {International Joint Conference on Neural Networks},
  year      = {2025},
  publisher = {IEEE},
  doi       = {10.1109/IJCNN64981.2025.11227985},
}