% Conference paper (see booktitle/year below); the url field points to the paper's OpenReview forum page.
@inproceedings{zhang2025beingvl0,
  author    = {Zhang, Wanpeng and Xie, Zilong and Feng, Yicheng and Li, Yijiang and Xing, Xingrun and Zheng, Sipeng and Lu, Zongqing},
  title     = {From Pixels to Tokens: Byte-Pair Encoding on Quantized Visual Modalities},
  booktitle = {The Thirteenth International Conference on Learning Representations},
  year      = {2025},
  url       = {https://openreview.net/forum?id=3TnLGGHhNx},
}