<?xml version="1.0" encoding="US-ASCII"?>
<dblp>
<inproceedings key="conf/mlsys/0002TTYCWXDG024" mdate="2025-08-05">
<author>Ji Lin 0002</author>
<author>Jiaming Tang</author>
<author>Haotian Tang</author>
<author>Shang Yang</author>
<author>Wei-Ming Chen</author>
<author>Wei-Chen Wang 0002</author>
<author>Guangxuan Xiao</author>
<author>Xingyu Dang</author>
<author>Chuang Gan 0001</author>
<author>Song Han 0003</author>
<title>AWQ: Activation-aware Weight Quantization for On-Device LLM Compression and Acceleration.</title>
<year>2024</year>
<booktitle>MLSys</booktitle>
<ee type="oa">https://proceedings.mlsys.org/paper_files/paper/2024/hash/42a452cbafa9dd64e9ba4aa95cc1ef21-Abstract-Conference.html</ee>
<crossref>conf/mlsys/2024</crossref>
<url>db/conf/mlsys/mlsys2024.html#0002TTYCWXDG024</url>
</inproceedings>
</dblp>
