{"id":"https://openalex.org/W7163998326","doi":"https://doi.org/10.1145/3748522.3779736","title":"ICICLE: An Interactive VLM-based System for Information Extraction from Ambiguous Engineering Diagram Legends","display_name":"ICICLE: An Interactive VLM-based System for Information Extraction from Ambiguous Engineering Diagram Legends","publication_year":2026,"publication_date":"2026-03-23","ids":{"openalex":"https://openalex.org/W7163998326","doi":"https://doi.org/10.1145/3748522.3779736"},"language":null,"primary_location":{"id":"doi:10.1145/3748522.3779736","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3748522.3779736","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 41st ACM/SIGAPP Symposium on Applied Computing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3748522.3779736","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5077592011","display_name":"Vasil Shteriyanov","orcid":"https://orcid.org/0009-0006-2515-6951"},"institutions":[{"id":"https://openalex.org/I83019370","display_name":"Eindhoven University of Technology","ror":"https://ror.org/02c2kyt77","country_code":"NL","type":"education","lineage":["https://openalex.org/I83019370"]}],"countries":["NL"],"is_corresponding":true,"raw_author_name":"Vasil Shteriyanov","raw_affiliation_strings":["Mathematics and Computer Science, Eindhoven University of Technology, Eindhoven, Netherlands"],"raw_orcid":"https://orcid.org/0009-0006-2515-6951","affiliations":[{"raw_affiliation_string":"Mathematics and Computer Science, Eindhoven University of Technology, Eindhoven, Netherlands","institution_ids":["https://openalex.org/I83019370"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081486976","display_name":"\u0420\u0438\u043c\u043c\u0430 \u0414\u0436\u0443\u0441\u0443\u043f\u043e\u0432\u0430","orcid":"https://orcid.org/0000-0003-3411-4084"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rimma Dzhusupova","raw_affiliation_strings":["McDermott International, The Hague, Netherlands"],"raw_orcid":"https://orcid.org/0000-0003-3411-4084","affiliations":[{"raw_affiliation_string":"McDermott International, The Hague, Netherlands","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010170972","display_name":"Jan Bosch","orcid":"https://orcid.org/0000-0003-2854-722X"},"institutions":[{"id":"https://openalex.org/I66862912","display_name":"Chalmers University of Technology","ror":"https://ror.org/040wg7k59","country_code":"SE","type":"education","lineage":["https://openalex.org/I66862912"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Jan Bosch","raw_affiliation_strings":["Chalmers University of Technology, Gothenburg, Sweden"],"raw_orcid":"https://orcid.org/0000-0003-2854-722X","affiliations":[{"raw_affiliation_string":"Chalmers University of Technology, Gothenburg, Sweden","institution_ids":["https://openalex.org/I66862912"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5105368845","display_name":"\u00d6lsson","orcid":null},"institutions":[{"id":"https://openalex.org/I183111857","display_name":"Malm\u00f6 University","ror":"https://ror.org/05wp7an13","country_code":"SE","type":"education","lineage":["https://openalex.org/I183111857"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Helena Holmstr\u00f6m Olsson","raw_affiliation_strings":["Malmo University, Malmo, Sweden"],"raw_orcid":"https://orcid.org/0000-0002-7700-1816","affiliations":[{"raw_affiliation_string":"Malmo University, Malmo, Sweden","institution_ids":["https://openalex.org/I183111857"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5077592011"],"corresponding_institution_ids":["https://openalex.org/I83019370"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.95749053,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"798","last_page":"805"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.34610000252723694,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.34610000252723694,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11006","display_name":"BIM and Construction Integration","score":0.1216999962925911,"subfield":{"id":"https://openalex.org/subfields/2215","display_name":"Building and Construction"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.07580000162124634,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.5683000087738037},{"id":"https://openalex.org/keywords/parsing","display_name":"Parsing","score":0.5317000150680542},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.5246999859809875},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.5072000026702881},{"id":"https://openalex.org/keywords/information-extraction","display_name":"Information extraction","score":0.49570000171661377},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.4390999972820282},{"id":"https://openalex.org/keywords/lexicon","display_name":"Lexicon","score":0.3783000111579895},{"id":"https://openalex.org/keywords/automation","display_name":"Automation","score":0.3353999853134155}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7602999806404114},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5924999713897705},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.5683000087738037},{"id":"https://openalex.org/C186644900","wikidata":"https://www.wikidata.org/wiki/Q194152","display_name":"Parsing","level":2,"score":0.5317000150680542},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.5246999859809875},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.5072000026702881},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.49900001287460327},{"id":"https://openalex.org/C195807954","wikidata":"https://www.wikidata.org/wiki/Q1662562","display_name":"Information extraction","level":2,"score":0.49570000171661377},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.4390999972820282},{"id":"https://openalex.org/C2778121359","wikidata":"https://www.wikidata.org/wiki/Q8096","display_name":"Lexicon","level":2,"score":0.3783000111579895},{"id":"https://openalex.org/C115901376","wikidata":"https://www.wikidata.org/wiki/Q184199","display_name":"Automation","level":2,"score":0.3353999853134155},{"id":"https://openalex.org/C184408114","wikidata":"https://www.wikidata.org/wiki/Q1502022","display_name":"Generative Design","level":3,"score":0.32030001282691956},{"id":"https://openalex.org/C127705205","wikidata":"https://www.wikidata.org/wiki/Q5748245","display_name":"Heuristics","level":2,"score":0.3179999887943268},{"id":"https://openalex.org/C2776411971","wikidata":"https://www.wikidata.org/wiki/Q17141398","display_name":"Sublanguage","level":2,"score":0.30660000443458557},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.29899999499320984},{"id":"https://openalex.org/C2780878386","wikidata":"https://www.wikidata.org/wiki/Q1659648","display_name":"Visual language","level":2,"score":0.29109999537467957},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.2874000072479248},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.28700000047683716},{"id":"https://openalex.org/C2777655017","wikidata":"https://www.wikidata.org/wiki/Q1501161","display_name":"Toolbox","level":2,"score":0.27399998903274536},{"id":"https://openalex.org/C180198813","wikidata":"https://www.wikidata.org/wiki/Q121182","display_name":"Information system","level":2,"score":0.26840001344680786},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.25999999046325684},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.25440001487731934},{"id":"https://openalex.org/C9354725","wikidata":"https://www.wikidata.org/wiki/Q286017","display_name":"Operationalization","level":2,"score":0.25369998812675476},{"id":"https://openalex.org/C2777601683","wikidata":"https://www.wikidata.org/wiki/Q6499736","display_name":"Vocabulary","level":2,"score":0.2533999979496002}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3748522.3779736","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3748522.3779736","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 41st ACM/SIGAPP Symposium on Applied Computing","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3748522.3779736","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3748522.3779736","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 41st ACM/SIGAPP Symposium on Applied Computing","raw_type":"proceedings-article"},"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","score":0.6855958700180054,"id":"https://metadata.un.org/sdg/9"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":16,"referenced_works":["https://openalex.org/W2001642682","https://openalex.org/W2605982830","https://openalex.org/W3036037642","https://openalex.org/W4283454975","https://openalex.org/W4387444376","https://openalex.org/W4390873481","https://openalex.org/W4390873795","https://openalex.org/W4390874575","https://openalex.org/W4400681686","https://openalex.org/W4402726948","https://openalex.org/W4402727137","https://openalex.org/W4406895099","https://openalex.org/W4409014148","https://openalex.org/W4414933810","https://openalex.org/W4416266451","https://openalex.org/W4416840107"],"related_works":[],"abstract_inverted_index":{"Engineering":[0],"legend":[1,113],"sheets":[2,114],"are":[3],"vital":[4],"in":[5,97,174],"Engineering,":[6],"Procurement,":[7],"and":[8,129,147],"Construction":[9],"(EPC)":[10],"projects,":[11,118],"visually":[12],"defining":[13],"complex":[14,170],"assemblies.":[15],"Automating":[16],"information":[17,171],"extraction":[18,122,172],"from":[19,115],"these":[20,54],"legends":[21],"can":[22],"significantly":[23],"reduce":[24],"manual":[25],"effort,":[26],"yet":[27],"their":[28],"spatially":[29],"ambiguous":[30],"layouts":[31],"pose":[32],"barriers":[33],"to":[34,90,126],"digital":[35],"transformation.":[36],"To":[37],"address":[38],"this,":[39],"we":[40],"introduce":[41],"ICICLE":[42,154],"(In-Context":[43],"Interactive":[44],"Cue-guided":[45],"Legend":[46],"Extractor),":[47],"a":[48,70,77,83,157,166],"Generative":[49,163],"AI":[50],"system":[51,102],"for":[52,152,161,168],"parsing":[53],"documents.":[55],"ICICLE's":[56],"core":[57],"innovation":[58],"is":[59,150],"the":[60,88,101,141],"In-Context":[61],"Multimodal":[62],"Annotation":[63],"Prompting":[64],"(ICMAP)":[65],"method.":[66],"This":[67,86],"technique":[68],"instructs":[69],"Vision":[71],"Language":[72],"Model":[73],"(VLM)":[74],"by":[75],"providing":[76],"single":[78],"annotated":[79],"visual":[80,98,134,145],"example":[81],"alongside":[82],"textual":[84,148],"prompt.":[85],"enables":[87],"VLM":[89],"ground":[91],"abstract":[92],"concepts":[93],"like":[94],"\"detailed":[95],"assembly\"":[96],"evidence,":[99],"making":[100],"adaptable":[103],"without":[104],"per-query":[105],"annotation":[106],"or":[107],"costly":[108],"model":[109],"retraining.":[110],"Validated":[111],"on":[112],"four":[116],"industrial":[117,176],"ICMAP":[119],"achieved":[120],"superior":[121],"accuracy":[123],"(96\u2013100%)":[124],"compared":[125],"established":[127],"alternatives":[128],"demonstrated":[130],"robustness":[131],"across":[132],"varied":[133],"examples.":[135],"An":[136],"ablation":[137],"study":[138,160],"confirms":[139],"that":[140],"tight":[142],"coupling":[143],"of":[144],"annotations":[146],"instructions":[149],"critical":[151],"success.":[153],"serves":[155],"as":[156],"successful":[158],"case":[159],"operationalizing":[162],"AI,":[164],"offering":[165],"blueprint":[167],"solving":[169],"tasks":[173],"challenging":[175],"domains.":[177]},"counts_by_year":[],"updated_date":"2026-06-10T14:10:52.464848","created_date":"2026-06-10T00:00:00"}
