% SpQR conference paper (booktitle: The Twelfth International Conference on
% Learning Representations). The original entry had no citation key; the key
% below was assigned during review -- confirm it matches the key scheme used
% by the documents that cite this file.
@inproceedings{dettmers2024spqr,
  author    = {Dettmers, Tim and
               Svirschevski, Ruslan A. and
               Egiazarian, Vage and
               Kuznedelev, Denis and
               Frantar, Elias and
               Ashkboos, Saleh and
               Borzunov, Alexander and
               Hoefler, Torsten and
               Alistarh, Dan},
  title     = {{SpQR}: A Sparse-Quantized Representation for Near-Lossless {LLM} Weight Compression},
  booktitle = {The Twelfth International Conference on Learning Representations},
  year      = {2024},
  month     = may,
  doi       = {10.48550/arXiv.2306.03078},
}