% COLM 2024 conference paper; the arXiv identifier below is taken from the entry's URL.
% NOTE(review): the arXiv listing for 2404.05955 appears to be titled "VisualWebBench: ..." -- confirm the title wording against the published version.
@inproceedings{liu24webbench,
  author        = {Liu, Junpeng and Song, Yifan and Lin, Bill Yuchen and Lam, Wai and Neubig, Graham and Li, Yuanzhi and Yue, Xiang},
  title         = {{WebBench}: How Far Have Multimodal {LLM}s Evolved in Web Page Understanding and Grounding?},
  booktitle     = {Conference on Language Modeling (COLM)},
  address       = {Philadelphia, USA},
  month         = oct,
  year          = {2024},
  eprint        = {2404.05955},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2404.05955},
}