{"id":"https://openalex.org/W7128608257","doi":"https://doi.org/10.1109/icnsc66229.2025.00049","title":"A Method for Generating Elevator Detection Video Texts Based on Semantic Recognition","display_name":"A Method for Generating Elevator Detection Video Texts Based on Semantic Recognition","publication_year":2025,"publication_date":"2025-10-01","ids":{"openalex":"https://openalex.org/W7128608257","doi":"https://doi.org/10.1109/icnsc66229.2025.00049"},"language":null,"primary_location":{"id":"doi:10.1109/icnsc66229.2025.00049","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icnsc66229.2025.00049","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Conference on Networking, Sensing and Control (ICNSC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5125626380","display_name":"Hongyi Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I4210117890","display_name":"Sichuan Entry-Exit Inspection and Quarantine Bureau","ror":"https://ror.org/02490t938","country_code":"CN","type":"government","lineage":["https://openalex.org/I4210117890"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Hongyi Chen","raw_affiliation_strings":["Sichuan Special Equipment Inspection Institute,Chengdu,Sichuan"],"affiliations":[{"raw_affiliation_string":"Sichuan Special Equipment Inspection Institute,Chengdu,Sichuan","institution_ids":["https://openalex.org/I4210117890"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125660830","display_name":"Yuhui Peng","orcid":null},"institutions":[{"id":"https://openalex.org/I4210117890","display_name":"Sichuan Entry-Exit Inspection and Quarantine Bureau","ror":"https://ror.org/02490t938","country_code":"CN","type":"government","lineage":["https://openalex.org/I4210117890"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuhui Peng","raw_affiliation_strings":["Sichuan Special Equipment Inspection Institute,Chengdu,Sichuan"],"affiliations":[{"raw_affiliation_string":"Sichuan Special Equipment Inspection Institute,Chengdu,Sichuan","institution_ids":["https://openalex.org/I4210117890"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074071157","display_name":"Yixiang Yuan","orcid":"https://orcid.org/0009-0007-5421-3406"},"institutions":[{"id":"https://openalex.org/I4210117890","display_name":"Sichuan Entry-Exit Inspection and Quarantine Bureau","ror":"https://ror.org/02490t938","country_code":"CN","type":"government","lineage":["https://openalex.org/I4210117890"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yixiang Yuan","raw_affiliation_strings":["Sichuan Special Equipment Inspection Institute,Chengdu,Sichuan"],"affiliations":[{"raw_affiliation_string":"Sichuan Special Equipment Inspection Institute,Chengdu,Sichuan","institution_ids":["https://openalex.org/I4210117890"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059625416","display_name":"Zhanbin Zhang","orcid":"https://orcid.org/0009-0004-1391-0801"},"institutions":[{"id":"https://openalex.org/I4210117890","display_name":"Sichuan Entry-Exit Inspection and Quarantine Bureau","ror":"https://ror.org/02490t938","country_code":"CN","type":"government","lineage":["https://openalex.org/I4210117890"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhanbin Zhang","raw_affiliation_strings":["Sichuan Special Equipment Inspection Institute,Chengdu,Sichuan"],"affiliations":[{"raw_affiliation_string":"Sichuan Special Equipment Inspection Institute,Chengdu,Sichuan","institution_ids":["https://openalex.org/I4210117890"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062203736","display_name":"Yujie Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I4210117890","display_name":"Sichuan Entry-Exit Inspection and Quarantine Bureau","ror":"https://ror.org/02490t938","country_code":"CN","type":"government","lineage":["https://openalex.org/I4210117890"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yujie Chen","raw_affiliation_strings":["Sichuan Special Equipment Inspection Institute,Chengdu,Sichuan"],"affiliations":[{"raw_affiliation_string":"Sichuan Special Equipment Inspection Institute,Chengdu,Sichuan","institution_ids":["https://openalex.org/I4210117890"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5112367951","display_name":"Jianhong Gan","orcid":null},"institutions":[{"id":"https://openalex.org/I24201400","display_name":"Chengdu University of Information Technology","ror":"https://ror.org/01yxwrh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I24201400"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jianhong Gan","raw_affiliation_strings":["Chengdu University of Information Technology,Chengdu,Sichuan"],"affiliations":[{"raw_affiliation_string":"Chengdu University of Information Technology,Chengdu,Sichuan","institution_ids":["https://openalex.org/I24201400"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5125626380"],"corresponding_institution_ids":["https://openalex.org/I4210117890"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.72313467,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"249","last_page":"254"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T14011","display_name":"Elevator Systems and Control","score":0.7644000053405762,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T14011","display_name":"Elevator Systems and Control","score":0.7644000053405762,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12206","display_name":"Vibration and Dynamic Analysis","score":0.029899999499320984,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11606","display_name":"Infrastructure Maintenance and Monitoring","score":0.026200000196695328,"subfield":{"id":"https://openalex.org/subfields/2205","display_name":"Civil and Structural Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/elevator","display_name":"Elevator","score":0.7998999953269958},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.6482999920845032},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.645799994468689},{"id":"https://openalex.org/keywords/semantic-feature","display_name":"Semantic feature","score":0.5038999915122986},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.44290000200271606},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.4223000109195709},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.4178999960422516},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.41530001163482666},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.3984000086784363}],"concepts":[{"id":"https://openalex.org/C147021018","wikidata":"https://www.wikidata.org/wiki/Q252451","display_name":"Elevator","level":2,"score":0.7998999953269958},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7911999821662903},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.6482999920845032},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.645799994468689},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5760999917984009},{"id":"https://openalex.org/C2781122975","wikidata":"https://www.wikidata.org/wiki/Q16928266","display_name":"Semantic feature","level":2,"score":0.5038999915122986},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.44290000200271606},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.4223000109195709},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.4178999960422516},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.41530001163482666},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4146000146865845},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.3984000086784363},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.38670000433921814},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3718000054359436},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3684000074863434},{"id":"https://openalex.org/C2983812711","wikidata":"https://www.wikidata.org/wiki/Q167555","display_name":"Text recognition","level":3,"score":0.3352999985218048},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.3154999911785126},{"id":"https://openalex.org/C194789388","wikidata":"https://www.wikidata.org/wiki/Q17855283","display_name":"CAD","level":2,"score":0.29989999532699585},{"id":"https://openalex.org/C160633673","wikidata":"https://www.wikidata.org/wiki/Q355198","display_name":"Pixel","level":2,"score":0.2939999997615814},{"id":"https://openalex.org/C180863505","wikidata":"https://www.wikidata.org/wiki/Q5439687","display_name":"Feature recognition","level":3,"score":0.29019999504089355},{"id":"https://openalex.org/C90312973","wikidata":"https://www.wikidata.org/wiki/Q7449052","display_name":"Semantic data model","level":2,"score":0.28439998626708984},{"id":"https://openalex.org/C193125573","wikidata":"https://www.wikidata.org/wiki/Q7449065","display_name":"Semantic interpretation","level":2,"score":0.2842999994754791},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.2800999879837036},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.27300000190734863},{"id":"https://openalex.org/C2777946921","wikidata":"https://www.wikidata.org/wiki/Q7449044","display_name":"Semantic analysis (machine learning)","level":2,"score":0.27250000834465027},{"id":"https://openalex.org/C2983589003","wikidata":"https://www.wikidata.org/wiki/Q167555","display_name":"Text detection","level":3,"score":0.25380000472068787}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icnsc66229.2025.00049","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icnsc66229.2025.00049","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Conference on Networking, Sensing and Control (ICNSC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.4265974164009094,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"When":[0],"retrieving":[1],"and":[2,27,46,51,71,103,120,125,165,174,180],"checking":[3],"elevator":[4,34,159,186],"inspection":[5,35,178],"videos,":[6],"manual":[7],"processing":[8],"has":[9,113],"problems,":[10],"such":[11,122],"as":[12,123,162],"low":[13],"efficiency,":[14],"strong":[15],"subjectivity.":[16],"This":[17],"paper":[18],"proposes":[19],"a":[20],"video-to-text":[21],"method":[22],"based":[23],"on":[24],"semantic":[25,44,82],"segmentation":[26],"other":[28,139,153],"language":[29],"models.":[30,140,154],"The":[31,127,141],"model":[32,79,112],"converts":[33],"videos":[36],"into":[37],"texts":[38],"by":[39],"means":[40],"of":[41,74,99,118,176],"keyframe":[42],"extraction,":[43],"recognition":[45],"segmentation,":[47],"dual-path":[48,60],"feature":[49,61],"encoding,":[50],"text":[52,86,179],"generation":[53],"using":[54],"the":[55,65,72,75,78,96,110,172],"Blip":[56],"model.":[57],"It":[58,155,169],"uses":[59],"encoding.":[62],"By":[63],"fusing":[64],"encoded":[66],"Mask":[67],"features":[68,73],"from":[69],"UNet":[70],"input":[76],"images,":[77],"provides":[80,181],"image":[81],"support":[83,183],"for":[84,184],"accurate":[85],"generation.":[87],"A":[88],"collaborative":[89],"loss":[90],"function":[91],"is":[92,129,132,143,146],"proposed,":[93],"which":[94,131,145],"weights":[95],"cross-entropy":[97],"losses":[98],"UNet,":[100],"BLIP":[101],"model,":[102],"real":[104],"labels.":[105],"Experimental":[106],"results":[107],"show":[108],"that":[109],"proposed":[111],"better":[114],"performance":[115],"in":[116],"terms":[117],"CIDEr":[119,128],"SPICE,":[121],"BLIP2":[124],"LLaVA.":[126],"123.7,":[130],"2.7":[133,147],"to":[134,148],"5.4":[135,149],"times":[136,150],"higher":[137,151],"than":[138,152],"SPICE":[142],"18.9,":[144],"can":[156],"accurately":[157],"identify":[158],"parts":[160],"(such":[161],"drive":[163],"motors)":[164],"generate":[166],"professional":[167],"descriptions.":[168],"effectively":[170],"improves":[171],"quality":[173],"efficiency":[175],"generating":[177],"technical":[182],"smarter":[185],"inspection.":[187]},"counts_by_year":[],"updated_date":"2026-02-12T06:17:30.163165","created_date":"2026-02-12T00:00:00"}
