{"version.version":"0.0.7","version.cm_url":"https://github.com/ceurws/ceur-spt","spt.html_url":"/Vol-4112/68_main_long.html","spt.description":null,"spt.id":"Vol-4112/68_main_long","spt.wikidataid":null,"spt.title":"Easy to Complete, Hard to Choose: Investigating LLM Performance on the ProverbIT Benchmark","spt.pdfUrl":"https://ceur-ws.org/Vol-4112/68_main_long.pdf","spt.volume":{"number":4112,"acronym":"CLiC-it 2025","wikidataid":null,"title":"Proceedings of the Eleventh Italian Conference on Computational Linguistics (CLiC-it 2025)","description":null,"url":null,"date":"2025-11-30","dblp":null,"k10plus":null,"urn":null},"spt.session":null,"cvb.id":"Vol-4112/68_main_long","cvb.title":"Easy to Complete, Hard to Choose: Investigating LLM Performance on the ProverbIT Benchmark","cvb.type":null,"cvb.position":null,"cvb.pagesFrom":null,"cvb.pagesTo":null,"cvb.authors":"Enrico Mensa,Lorenzo Zane,Calogero Jerik Scozzaro,Matteo Delsanto,Tommaso Milani,Daniele P. Radicioni","cvb.vol_number":"4112","cvb.pdf_name":"68_main_long.pdf","cvb.pages":null,"cvb.fail":null}