{"id":"https://openalex.org/W7154684238","doi":"https://doi.org/10.48550/arxiv.2604.14448","title":"MARCA: A Checklist-Based Benchmark for Multilingual Web Search","display_name":"MARCA: A Checklist-Based Benchmark for Multilingual Web Search","publication_year":2026,"publication_date":"2026-04-15","ids":{"openalex":"https://openalex.org/W7154684238","doi":"https://doi.org/10.48550/arxiv.2604.14448"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.14448","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.14448","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.14448","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5009573252","display_name":"Thales Sales Almeida","orcid":"https://orcid.org/0009-0006-9568-9331"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Almeida, Thales Sales","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5092457173","display_name":"Giovana Kerche Bon\u00e1s","orcid":"https://orcid.org/0009-0001-9460-8353"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bon\u00e1s, Giovana Kerche","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086873271","display_name":"Ramon Pires","orcid":"https://orcid.org/0000-0002-0023-1971"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pires, Ramon","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075320829","display_name":"Celio H. N. Larcher","orcid":"https://orcid.org/0000-0002-4861-6571"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Larcher, Celio","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043191034","display_name":"Hugo Abonizio","orcid":"https://orcid.org/0000-0001-5208-0290"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Abonizio, Hugo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045896508","display_name":"Marcos Piau","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Piau, Marcos","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Junior, Roseval Malaquias","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Junior, Roseval Malaquias","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133852277","display_name":"Rodrigo Nogueira","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nogueira, Rodrigo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5036997454","display_name":"Thiago Laitz","orcid":"https://orcid.org/0000-0001-7205-2094"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Laitz, Thiago","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5009573252"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10286","display_name":"Information Retrieval and Search Behavior","score":0.44040000438690186,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10286","display_name":"Information Retrieval and Search Behavior","score":0.44040000438690186,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.22689999639987946,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13274","display_name":"Expert finding and Q&A systems","score":0.14839999377727509,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.7757999897003174},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5519999861717224},{"id":"https://openalex.org/keywords/rubric","display_name":"Rubric","score":0.4984999895095825},{"id":"https://openalex.org/keywords/ranking","display_name":"Ranking (information retrieval)","score":0.3971000015735626},{"id":"https://openalex.org/keywords/reliability","display_name":"Reliability (semiconductor)","score":0.3880000114440918},{"id":"https://openalex.org/keywords/measure","display_name":"Measure (data warehouse)","score":0.38769999146461487},{"id":"https://openalex.org/keywords/completeness","display_name":"Completeness (order theory)","score":0.385699987411499},{"id":"https://openalex.org/keywords/orchestration","display_name":"Orchestration","score":0.3587999939918518},{"id":"https://openalex.org/keywords/web-application","display_name":"Web application","score":0.34700000286102295}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8033999800682068},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.7757999897003174},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5519999861717224},{"id":"https://openalex.org/C111640148","wikidata":"https://www.wikidata.org/wiki/Q847349","display_name":"Rubric","level":2,"score":0.4984999895095825},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.46779999136924744},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4036000072956085},{"id":"https://openalex.org/C189430467","wikidata":"https://www.wikidata.org/wiki/Q7293293","display_name":"Ranking (information retrieval)","level":2,"score":0.3971000015735626},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.3880000114440918},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.38769999146461487},{"id":"https://openalex.org/C17231256","wikidata":"https://www.wikidata.org/wiki/Q5156540","display_name":"Completeness (order theory)","level":2,"score":0.385699987411499},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.36320000886917114},{"id":"https://openalex.org/C199168358","wikidata":"https://www.wikidata.org/wiki/Q3367000","display_name":"Orchestration","level":3,"score":0.3587999939918518},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.35580000281333923},{"id":"https://openalex.org/C118643609","wikidata":"https://www.wikidata.org/wiki/Q189210","display_name":"Web application","level":2,"score":0.34700000286102295},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3384999930858612},{"id":"https://openalex.org/C110875604","wikidata":"https://www.wikidata.org/wiki/Q75","display_name":"The Internet","level":2,"score":0.31220000982284546},{"id":"https://openalex.org/C127705205","wikidata":"https://www.wikidata.org/wiki/Q5748245","display_name":"Heuristics","level":2,"score":0.3041999936103821},{"id":"https://openalex.org/C97854310","wikidata":"https://www.wikidata.org/wiki/Q19541","display_name":"Search engine","level":2,"score":0.29510000348091125},{"id":"https://openalex.org/C62230096","wikidata":"https://www.wikidata.org/wiki/Q275969","display_name":"Crowdsourcing","level":2,"score":0.29179999232292175},{"id":"https://openalex.org/C166423231","wikidata":"https://www.wikidata.org/wiki/Q1891170","display_name":"Semantic search","level":3,"score":0.2791000008583069},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.274399995803833},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.2678999900817871},{"id":"https://openalex.org/C124681953","wikidata":"https://www.wikidata.org/wiki/Q339062","display_name":"Decomposition","level":2,"score":0.2662000060081482},{"id":"https://openalex.org/C184898388","wikidata":"https://www.wikidata.org/wiki/Q1435712","display_name":"Pairwise comparison","level":2,"score":0.26429998874664307},{"id":"https://openalex.org/C34736171","wikidata":"https://www.wikidata.org/wiki/Q918333","display_name":"Preprocessor","level":2,"score":0.25699999928474426},{"id":"https://openalex.org/C35578498","wikidata":"https://www.wikidata.org/wiki/Q193424","display_name":"Web service","level":2,"score":0.2549000084400177},{"id":"https://openalex.org/C21959979","wikidata":"https://www.wikidata.org/wiki/Q36774","display_name":"Web page","level":2,"score":0.25380000472068787},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.25220000743865967},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.2506999969482422}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.14448","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.14448","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.14448","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.14448","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.7912750840187073,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"language":[1],"models":[2,86,146],"(LLMs)":[3],"are":[4],"increasingly":[5],"used":[6],"as":[7],"sources":[8],"of":[9,64],"information,":[10],"yet":[11],"their":[12],"reliability":[13],"depends":[14],"on":[15,58],"the":[16,20],"ability":[17],"to":[18,150],"search":[19,97],"web,":[21],"select":[22],"relevant":[23],"evidence,":[24],"and":[25,34,40,52,81,98,100,120,140],"synthesize":[26],"complete":[27],"answers.":[28],"While":[29],"recent":[30],"benchmarks":[31],"evaluate":[32,84],"web-browsing":[33],"agentic":[35],"tool":[36],"use,":[37],"multilingual":[38],"settings,":[39],"Portuguese":[41],"in":[42,144],"particular,":[43],"remain":[44],"underexplored.":[45],"We":[46,83],"present":[47],"\\textsc{MARCA},":[48],"a":[49,91],"bilingual":[50],"(English":[51],"Portuguese)":[53],"benchmark":[54,153],"for":[55],"evaluating":[56],"LLMs":[57],"web-based":[59],"information":[60],"seeking.":[61],"\\textsc{MARCA}":[62],"consists":[63],"52":[65],"manually":[66,72],"authored":[67],"multi-entity":[68],"questions,":[69],"paired":[70],"with":[71,94,124],"validated":[73],"checklist-style":[74],"rubrics":[75],"that":[76,104,135],"explicitly":[77],"measure":[78],"answer":[79],"completeness":[80],"correctness.":[82],"14":[85],"under":[87],"two":[88],"interaction":[89],"settings:":[90],"Basic":[92],"framework":[93,103],"direct":[95],"web":[96],"scraping,":[99],"an":[101],"Orchestrator":[102],"enables":[105],"task":[106],"decomposition":[107],"via":[108],"delegated":[109],"subagents.":[110],"To":[111],"capture":[112],"stochasticity,":[113],"each":[114],"question":[115],"is":[116,122,154],"executed":[117],"multiple":[118],"times":[119],"performance":[121,132],"reported":[123],"run-level":[125],"uncertainty.":[126],"Across":[127],"models,":[128],"we":[129],"observe":[130],"large":[131],"differences,":[133],"find":[134],"orchestration":[136],"often":[137],"improves":[138],"coverage,":[139],"identify":[141],"substantial":[142],"variability":[143],"how":[145],"transfer":[147],"from":[148],"English":[149],"Portuguese.":[151],"The":[152],"available":[155],"at":[156],"https://github.com/maritaca-ai/MARCA":[157]},"counts_by_year":[],"updated_date":"2026-05-04T08:30:34.212998","created_date":"2026-04-18T00:00:00"}
