{"id":"https://openalex.org/W2908561850","doi":"https://doi.org/10.5220/0007248401730180","title":"Multi-stream CNN based Video Semantic Segmentation for Automated Driving","display_name":"Multi-stream CNN based Video Semantic Segmentation for Automated Driving","publication_year":2019,"publication_date":"2019-01-01","ids":{"openalex":"https://openalex.org/W2908561850","doi":"https://doi.org/10.5220/0007248401730180","mag":"2908561850"},"language":"en","primary_location":{"id":"doi:10.5220/0007248401730180","is_oa":true,"landing_page_url":"https://doi.org/10.5220/0007248401730180","pdf_url":null,"source":null,"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 14th International Joint Conference on Computer Vision, Imaging and Computer Graphics Theory and Applications","raw_type":"proceedings-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.5220/0007248401730180","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Ganesh Sistu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210126639","display_name":"Valeo (Ireland)","ror":"https://ror.org/031sgpn76","country_code":"IE","type":"company","lineage":["https://openalex.org/I220619192","https://openalex.org/I4210126639"]}],"countries":["IE"],"is_corresponding":true,"raw_author_name":"Ganesh Sistu","raw_affiliation_strings":["Valeo Vision Systems and Ireland, --- Select a Country ---"],"affiliations":[{"raw_affiliation_string":"Valeo Vision Systems and Ireland, --- Select a Country ---","institution_ids":["https://openalex.org/I4210126639"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Sumanth Chennupati","orcid":null},"institutions":[{"id":"https://openalex.org/I4210166119","display_name":"Valeo (United States)","ror":"https://ror.org/05x7wqc91","country_code":"US","type":"company","lineage":["https://openalex.org/I220619192","https://openalex.org/I4210166119"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sumanth Chennupati","raw_affiliation_strings":["Valeo Troy and U.S.A., --- Select a Country ---"],"affiliations":[{"raw_affiliation_string":"Valeo Troy and U.S.A., --- Select a Country ---","institution_ids":["https://openalex.org/I4210166119"]}]},{"author_position":"last","author":{"id":null,"display_name":"Senthil Yogamani","orcid":null},"institutions":[{"id":"https://openalex.org/I4210126639","display_name":"Valeo (Ireland)","ror":"https://ror.org/031sgpn76","country_code":"IE","type":"company","lineage":["https://openalex.org/I220619192","https://openalex.org/I4210126639"]}],"countries":["IE"],"is_corresponding":false,"raw_author_name":"Senthil Yogamani","raw_affiliation_strings":["Valeo Vision Systems and Ireland, --- Select a Country ---"],"affiliations":[{"raw_affiliation_string":"Valeo Vision Systems and Ireland, --- Select a Country ---","institution_ids":["https://openalex.org/I4210126639"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I4210126639"],"apc_list":null,"apc_paid":null,"fwci":0.7152,"has_fulltext":true,"cited_by_count":8,"citation_normalized_percentile":{"value":0.74101652,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"173","last_page":"180"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.8176000118255615},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.6370000243186951},{"id":"https://openalex.org/keywords/baseline","display_name":"Baseline (sea)","score":0.6083999872207642},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.6065000295639038},{"id":"https://openalex.org/keywords/frame","display_name":"Frame (networking)","score":0.5523999929428101},{"id":"https://openalex.org/keywords/computational-complexity-theory","display_name":"Computational complexity theory","score":0.44780001044273376},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.3984000086784363},{"id":"https://openalex.org/keywords/encoding","display_name":"Encoding (memory)","score":0.38179999589920044}],"concepts":[{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.8176000118255615},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8080999851226807},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6851999759674072},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.6370000243186951},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.6083999872207642},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.6065000295639038},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5724999904632568},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.5523999929428101},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.44780001044273376},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.3984000086784363},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.38179999589920044},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3783999979496002},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.37299999594688416},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.3693999946117401},{"id":"https://openalex.org/C2780586882","wikidata":"https://www.wikidata.org/wiki/Q7520643","display_name":"Simple (philosophy)","level":2,"score":0.3537999987602234},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.33169999718666077},{"id":"https://openalex.org/C18555067","wikidata":"https://www.wikidata.org/wiki/Q8375051","display_name":"Joint (building)","level":2,"score":0.3057999908924103},{"id":"https://openalex.org/C3261483","wikidata":"https://www.wikidata.org/wiki/Q119565","display_name":"Frame rate","level":2,"score":0.2906999886035919},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2775000035762787},{"id":"https://openalex.org/C182306322","wikidata":"https://www.wikidata.org/wiki/Q1779371","display_name":"Order (exchange)","level":2,"score":0.25870001316070557}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.5220/0007248401730180","is_oa":true,"landing_page_url":"https://doi.org/10.5220/0007248401730180","pdf_url":null,"source":null,"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 14th International Joint Conference on Computer Vision, Imaging and Computer Graphics Theory and Applications","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:1901.02511","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1901.02511","pdf_url":"https://arxiv.org/pdf/1901.02511","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"doi:10.5220/0007248401730180","is_oa":true,"landing_page_url":"https://doi.org/10.5220/0007248401730180","pdf_url":null,"source":null,"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 14th International Joint Conference on Computer Vision, Imaging and Computer Graphics Theory and Applications","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Majority":[0],"of":[1,14,55,73,99,106,118,160,177],"semantic":[2],"segmentation":[3],"algorithms":[4],"operate":[5],"on":[6,44],"a":[7,57,77,86],"single":[8],"frame":[9],"even":[10],"in":[11,129,188],"the":[12,19,27,65,71,90,111,130,150,168,193],"case":[13,54],"videos.":[15],"In":[16,53],"this":[17],"work,":[18],"goal":[20],"is":[21,62],"to":[22,192],"exploit":[23],"temporal":[24,35],"information":[25],"within":[26],"algorithm":[28],"model":[29],"for":[30,122,143,181],"leveraging":[31],"motion":[32],"cues":[33],"and":[34,48,67,93,104,120,124,141,146,162,179,183],"consistency.":[36],"We":[37,84,154],"propose":[38],"two":[39,169],"simple":[40],"high-level":[41],"architectures":[42],"based":[43],"Recurrent":[45],"FCN":[46,50,152],"(RFCN)":[47],"Multi-Stream":[49],"(MSFCN)":[51],"networks.":[52],"RFCN,":[56],"recurrent":[58],"network":[59,88],"namely":[60,97],"LSTM":[61],"inserted":[63],"between":[64],"encoder":[66,79,92],"decoder.":[68],"MSFCN":[69,98],"combines":[70],"encoders":[72],"different":[74],"frames":[75],"into":[76],"fused":[78],"via":[80],"1x1":[81],"channel-wise":[82],"convolution.":[83],"use":[85],"ResNet50":[87],"as":[89],"baseline":[91,151,194],"construct":[94],"three":[95],"networks":[96],"order":[100,107],"2":[101],"&":[102],"3":[103],"RFCN":[105],"2.":[108],"MSFCN-3":[109,137],"produces":[110],"best":[112],"results":[113],"with":[114,185],"an":[115,157,175],"accuracy":[116],"improvement":[117,176],"9%":[119],"15%":[121],"Highway":[123],"New":[125],"York-like":[126],"city":[127],"scenarios":[128],"SYNTHIA-CVPR'16":[131],"dataset":[132],"using":[133,164],"mean":[134],"IoU":[135],"metric.":[136],"also":[138,155],"produced":[139],"11%":[140,178],"6%":[142],"SegTrack":[144],"V2":[145],"DAVIS":[147],"datasets":[148],"over":[149],"network.":[153],"designed":[156],"efficient":[158,172],"version":[159],"MSFCN-2":[161,173],"RFCN-2":[163],"weight":[165],"sharing":[166],"among":[167],"encoders.":[170],"The":[171],"provided":[174],"5%":[180],"KITTI":[182],"SYNTHIA":[184],"negligible":[186],"increase":[187],"computational":[189],"complexity":[190],"compared":[191],"version.":[195]},"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":1}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2019-01-25T00:00:00"}
