% MX+ (MICRO '25). Acronyms are brace-protected so that styles applying
% sentence casing to titles do not downcase them.
@inproceedings{mx+,
  author    = {Lee, Jungi and Park, Junyong and Cha, Soohyun and Cho, Jaehoon and Sim, Jaewoong},
  title     = {{MX+}: Pushing the Limits of Microscaling Formats for Efficient Large Language Model Serving},
  booktitle = {Proceedings of the 58th Annual International Symposium on Microarchitecture ({MICRO})},
  series    = {MICRO '25},
  location  = {Seoul, Korea},
  year      = {2025},
}
2024
DAC ’24
MoNDE: Mixture of Near-Data Experts for Large-Scale Sparse Models
Taehyun Kim, Kwanseok Choi, Youngmock Cho, Jaehoon Cho, Hyuk-Jae Lee, and Jaewoong Sim
In Proceedings of the 61st ACM/IEEE Design Automation Conference, San Francisco, CA, USA, 2024
% MoNDE (DAC '24). Acronyms are brace-protected so that styles applying
% sentence casing to titles do not downcase them (e.g. "MoNDE" -> "Monde").
@inproceedings{monde,
  author    = {Kim, Taehyun and Choi, Kwanseok and Cho, Youngmock and Cho, Jaehoon and Lee, Hyuk-Jae and Sim, Jaewoong},
  title     = {{MoNDE}: Mixture of Near-Data Experts for Large-Scale Sparse Models},
  booktitle = {Proceedings of the 61st {ACM/IEEE} Design Automation Conference},
  series    = {DAC '24},
  location  = {San Francisco, CA, USA},
  year      = {2024},
}