{"id":"https://openalex.org/W4396674567","doi":"https://doi.org/10.3390/ijgi13050153","title":"Exploration of an Open Vocabulary Model on Semantic Segmentation for Street Scene Imagery","display_name":"Exploration of an Open Vocabulary Model on Semantic Segmentation for Street Scene Imagery","publication_year":2024,"publication_date":"2024-05-05","ids":{"openalex":"https://openalex.org/W4396674567","doi":"https://doi.org/10.3390/ijgi13050153"},"language":"en","primary_location":{"id":"doi:10.3390/ijgi13050153","is_oa":true,"landing_page_url":"https://doi.org/10.3390/ijgi13050153","pdf_url":"https://www.mdpi.com/2220-9964/13/5/153/pdf?version=1714902236","source":{"id":"https://openalex.org/S2764431341","display_name":"ISPRS International Journal of Geo-Information","issn_l":"2220-9964","issn":["2220-9964"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ISPRS International Journal of Geo-Information","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.mdpi.com/2220-9964/13/5/153/pdf?version=1714902236","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100599785","display_name":"Zichao Zeng","orcid":"https://orcid.org/0009-0002-8975-875X"},"institutions":[{"id":"https://openalex.org/I45129253","display_name":"University College London","ror":"https://ror.org/02jx3x895","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I45129253"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Zichao Zeng","raw_affiliation_strings":["Department of Civil, Environmental and Geomatic Engineering, University College London, London WC1E 6BT, UK"],"affiliations":[{"raw_affiliation_string":"Department of Civil, Environmental and Geomatic Engineering, University College London, London WC1E 6BT, UK","institution_ids":["https://openalex.org/I45129253"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5056951932","display_name":"J. Boehm","orcid":null},"institutions":[{"id":"https://openalex.org/I45129253","display_name":"University College London","ror":"https://ror.org/02jx3x895","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I45129253"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Jan Boehm","raw_affiliation_strings":["Department of Civil, Environmental and Geomatic Engineering, University College London, London WC1E 6BT, UK"],"affiliations":[{"raw_affiliation_string":"Department of Civil, Environmental and Geomatic Engineering, University College London, London WC1E 6BT, UK","institution_ids":["https://openalex.org/I45129253"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5100599785"],"corresponding_institution_ids":["https://openalex.org/I45129253"],"apc_list":{"value":1400,"currency":"CHF","value_usd":1515},"apc_paid":{"value":1400,"currency":"CHF","value_usd":1515},"fwci":1.4813,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.82710246,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"13","issue":"5","first_page":"153","last_page":"153"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11606","display_name":"Infrastructure Maintenance and Monitoring","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/2205","display_name":"Civil and Structural Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.74283367395401},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.6876115202903748},{"id":"https://openalex.org/keywords/vocabulary","display_name":"Vocabulary","score":0.6464142203330994},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5934783220291138},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5869725942611694},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5209399461746216},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5189720988273621},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.509070098400116},{"id":"https://openalex.org/keywords/flexibility","display_name":"Flexibility (engineering)","score":0.4525274336338043},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.39914795756340027},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.17411786317825317}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.74283367395401},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.6876115202903748},{"id":"https://openalex.org/C2777601683","wikidata":"https://www.wikidata.org/wiki/Q6499736","display_name":"Vocabulary","level":2,"score":0.6464142203330994},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5934783220291138},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5869725942611694},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5209399461746216},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5189720988273621},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.509070098400116},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.4525274336338043},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.39914795756340027},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.17411786317825317},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.3390/ijgi13050153","is_oa":true,"landing_page_url":"https://doi.org/10.3390/ijgi13050153","pdf_url":"https://www.mdpi.com/2220-9964/13/5/153/pdf?version=1714902236","source":{"id":"https://openalex.org/S2764431341","display_name":"ISPRS International Journal of Geo-Information","issn_l":"2220-9964","issn":["2220-9964"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ISPRS International Journal of Geo-Information","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:e0382054c13845228d526b9b0813bf12","is_oa":true,"landing_page_url":"https://doaj.org/article/e0382054c13845228d526b9b0813bf12","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"ISPRS International Journal of Geo-Information, Vol 13, Iss 5, p 153 (2024)","raw_type":"article"},{"id":"pmh:oai:eprints.ucl.ac.uk.OAI2:10191931","is_oa":true,"landing_page_url":"https://discovery.ucl.ac.uk/10191931/1/ijgi-13-00153.pdf","pdf_url":null,"source":{"id":"https://openalex.org/S4306400024","display_name":"UCL Discovery (University College London)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I45129253","host_organization_name":"University College London","host_organization_lineage":["https://openalex.org/I45129253"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"   ISPRS: International Journal of Geo-Information , 13  (5)    , Article 153. (2024)      ","raw_type":"Article"}],"best_oa_location":{"id":"doi:10.3390/ijgi13050153","is_oa":true,"landing_page_url":"https://doi.org/10.3390/ijgi13050153","pdf_url":"https://www.mdpi.com/2220-9964/13/5/153/pdf?version=1714902236","source":{"id":"https://openalex.org/S2764431341","display_name":"ISPRS International Journal of Geo-Information","issn_l":"2220-9964","issn":["2220-9964"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ISPRS International Journal of Geo-Information","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/11","display_name":"Sustainable cities and communities","score":0.4699999988079071}],"awards":[{"id":"https://openalex.org/G2262934471","display_name":null,"funder_award_id":"EP/W522077/1","funder_id":"https://openalex.org/F4320314731","funder_display_name":"UK Research and Innovation"}],"funders":[{"id":"https://openalex.org/F4320314731","display_name":"UK Research and Innovation","ror":"https://ror.org/001aqnf71"}],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4396674567.pdf"},"referenced_works_count":49,"referenced_works":["https://openalex.org/W1569892065","https://openalex.org/W1901129140","https://openalex.org/W1903029394","https://openalex.org/W2031489346","https://openalex.org/W2340897893","https://openalex.org/W2412782625","https://openalex.org/W2487365028","https://openalex.org/W2508741746","https://openalex.org/W2560023338","https://openalex.org/W2743627947","https://openalex.org/W2804860796","https://openalex.org/W2810392541","https://openalex.org/W2884436604","https://openalex.org/W2886944874","https://openalex.org/W2890231632","https://openalex.org/W2892220819","https://openalex.org/W2920827956","https://openalex.org/W2957077982","https://openalex.org/W2963073398","https://openalex.org/W2963787264","https://openalex.org/W2963881378","https://openalex.org/W2964254867","https://openalex.org/W2964309882","https://openalex.org/W2970599025","https://openalex.org/W3008115128","https://openalex.org/W3035564946","https://openalex.org/W3046751713","https://openalex.org/W3047375952","https://openalex.org/W3102977943","https://openalex.org/W3134208490","https://openalex.org/W3135367836","https://openalex.org/W3159481202","https://openalex.org/W3173859428","https://openalex.org/W3175294391","https://openalex.org/W3195494505","https://openalex.org/W3217147624","https://openalex.org/W4205172069","https://openalex.org/W4226182655","https://openalex.org/W4312747482","https://openalex.org/W4312768455","https://openalex.org/W4312956471","https://openalex.org/W4313026212","https://openalex.org/W4318718936","https://openalex.org/W4319072188","https://openalex.org/W4367674957","https://openalex.org/W4386047746","https://openalex.org/W4388616070","https://openalex.org/W4390874575","https://openalex.org/W4393002303"],"related_works":["https://openalex.org/W2378211422","https://openalex.org/W4321353415","https://openalex.org/W2745001401","https://openalex.org/W2130974462","https://openalex.org/W2028665553","https://openalex.org/W2086519370","https://openalex.org/W4246352526","https://openalex.org/W2121910908","https://openalex.org/W915438175","https://openalex.org/W4230315250"],"abstract_inverted_index":{"This":[0,148],"study":[1,66,156],"investigates":[2],"the":[3,13,57,69,76],"efficacy":[4],"of":[5,16,71,78],"an":[6],"open":[7,160],"vocabulary,":[8],"multi-modal,":[9],"foundation":[10],"model":[11],"for":[12,37,152,184],"semantic":[14,172],"segmentation":[15,89],"images":[17],"from":[18],"complex":[19,188],"urban":[20],"street":[21],"scenes.":[22],"Unlike":[23],"traditional":[24],"models":[25,131,162],"reliant":[26],"on":[27,68],"predefined":[28],"category":[29,38,54],"sets,":[30],"Grounded":[31,133,165],"SAM":[32,166],"uses":[33],"arbitrary":[34],"textual":[35,72,101,107],"inputs":[36],"definition,":[39],"offering":[40],"enhanced":[41],"flexibility":[42],"and":[43,52,63,75,125,179],"adaptability.":[44],"The":[45,65,155],"model\u2019s":[46],"performance":[47,86,186],"was":[48],"evaluated":[49],"across":[50],"single":[51],"multiple":[53],"tasks":[55],"using":[56],"benchmark":[58],"datasets":[59],"Cityscapes,":[60],"BDD100K,":[61],"GTA5,":[62],"KITTI.":[64],"focused":[67],"impact":[70],"input":[73],"refinement":[74],"challenges":[77,114],"classifying":[79],"visually":[80,119],"similar":[81,120],"categories.":[82],"Results":[83],"indicate":[84],"strong":[85],"in":[87,93,106,116,171,176,187],"single-category":[88],"but":[90],"highlighted":[91],"difficulties":[92],"multi-category":[94],"scenarios,":[95],"particularly":[96,137],"with":[97,129],"categories":[98],"bearing":[99],"close":[100],"or":[102],"visual":[103],"resemblances.":[104],"Adjustments":[105],"prompts":[108],"significantly":[109],"improved":[110],"detection":[111],"accuracy,":[112],"though":[113],"persisted":[115],"distinguishing":[117],"between":[118],"objects":[121],"such":[122,163],"as":[123,164],"buses":[124],"trains.":[126],"Comparative":[127],"analysis":[128],"state-of-the-art":[130],"revealed":[132],"SAM\u2019s":[134],"competitive":[135],"performance,":[136],"notable":[138],"given":[139],"its":[140],"direct":[141],"inference":[142],"capability":[143],"without":[144],"extensive":[145],"dataset-specific":[146],"training.":[147],"feature":[149],"is":[150],"advantageous":[151],"resource-limited":[153],"applications.":[154],"concludes":[157],"that":[158],"while":[159],"vocabulary":[161],"mark":[167],"a":[168],"significant":[169],"advancement":[170],"segmentation,":[173],"further":[174],"improvements":[175],"integrating":[177],"image":[178],"text":[180],"processing":[181],"are":[182],"essential":[183],"better":[185],"scenarios.":[189]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":1}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
