@comment{infinigen: the source author list tagged Wonbeom Lee and Jungi Lee
  with a trailing "*" (presumably an equal-contribution marker -- confirm).
  The marker is dropped from the author field because BibTeX would treat it
  as part of the surname when formatting and sorting.}
@inproceedings{infinigen,
  author    = {Lee, Wonbeom and Lee, Jungi and Seo, Junghwan and Sim, Jaewoong},
  title     = {{InfiniGen}: Efficient Generative Inference of Large Language Models with Dynamic {KV} Cache Management},
  booktitle = {Proceedings of the 18th {USENIX} Symposium on Operating Systems Design and Implementation ({OSDI})},
  series    = {OSDI '24},
  year      = {2024},
}
ISCA-51
Tender: Accelerating Large Language Models via Tensor Decompostion and Runtime Requantization
Jungi Lee*, Wonbeom Lee* , and Jaewoong Sim
In Proceedings of the 51st Annual International Symposium on Computer Architecture (ISCA) , Buenos Aires, Argentina, 2024
@comment{tender: the source author list tagged Jungi Lee and Wonbeom Lee
  with a trailing "*" (presumably an equal-contribution marker -- confirm).
  The marker is dropped from the author field because BibTeX would treat it
  as part of the surname when formatting and sorting.}
@inproceedings{tender,
  author    = {Lee, Jungi and Lee, Wonbeom and Sim, Jaewoong},
  title     = {Tender: Accelerating Large Language Models via Tensor Decomposition and Runtime Requantization},
  booktitle = {Proceedings of the 51st Annual International Symposium on Computer Architecture ({ISCA})},
  series    = {ISCA '24},
  year      = {2024},
}
ASPLOS ’24
GSCore: Efficient Radiance Field Rendering via Architectural Support for 3D Gaussian Splatting
Junseo Lee , Seokwon Lee , Jungi Lee, Junyong Park , and Jaewoong Sim
In Proceedings of the 2024 International Conference on Architectural Support for Programming Languages and Operating Systems (ASPLOS) , San Diego, CA, USA, 2024
@comment{gscore: braces in the title keep the system name, "3D" and the
  proper noun "Gaussian" capitalised under styles that sentence-case titles.}
@inproceedings{gscore,
  author    = {Lee, Junseo and Lee, Seokwon and Lee, Jungi and Park, Junyong and Sim, Jaewoong},
  title     = {{GSCore}: Efficient Radiance Field Rendering via Architectural Support for {3D} {Gaussian} Splatting},
  booktitle = {Proceedings of the 2024 International Conference on Architectural Support for Programming Languages and Operating Systems ({ASPLOS})},
  series    = {ASPLOS '24},
  year      = {2024},
}
2023
ISCA-50
NeuRex: A Case for Neural Rendering Acceleration
Junseo Lee , Kwanseok Choi , Jungi Lee, Seokwon Lee , Joonho Whangbo , and Jaewoong Sim
In Proceedings of the 50th Annual International Symposium on Computer Architecture (ISCA) , Orlando, FL, USA, 2023
@comment{neurex: the braces around the system name keep its internal
  capital under styles that sentence-case titles.}
@inproceedings{neurex,
  author    = {Lee, Junseo and Choi, Kwanseok and Lee, Jungi and Lee, Seokwon and Whangbo, Joonho and Sim, Jaewoong},
  title     = {{NeuRex}: A Case for Neural Rendering Acceleration},
  booktitle = {Proceedings of the 50th Annual International Symposium on Computer Architecture ({ISCA})},
  series    = {ISCA '23},
  year      = {2023},
}