


default search action
BibTeX record journals/corr/abs-2402-09748
% dblp record for an arXiv preprint (CoRR). The url, biburl and bibsource
% values previously carried a web-proxy prefix ("") that
% made the links point away from doi.org / dblp.org; the canonical hosts are
% restored below. The doi field holds the bare DOI without a resolver prefix.
@article{DBLP:journals/corr/abs-2402-09748,
  author     = {Wang, Wenxiao and
                Chen, Wei and
                Luo, Yicong and
                Long, Yongliu and
                Lin, Zhengkai and
                Zhang, Liye and
                Lin, Binbin and
                Cai, Deng and
                He, Xiaofei},
  title      = {Model Compression and Efficient Inference for Large Language Models:
                {A} Survey},
  journal    = {CoRR},
  volume     = {abs/2402.09748},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2402.09748},
  doi        = {10.48550/ARXIV.2402.09748},
  eprinttype = {arXiv},
  eprint     = {2402.09748},
  timestamp  = {Thu, 25 Jul 2024 07:47:44 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2402-09748.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

manage site settings
To protect your privacy, all features that rely on external API calls from your browser are turned off by default. You need to opt in for them to become active. All settings here will be stored as cookies in your web browser. For more information, see our F.A.Q.