{"id":"https://openalex.org/W7161683463","doi":"https://doi.org/10.48550/arxiv.2605.18328","title":"CineMatte: Background Matting for Virtual Production and Beyond","display_name":"CineMatte: Background Matting for Virtual Production and Beyond","publication_year":2026,"publication_date":"2026-05-18","ids":{"openalex":"https://openalex.org/W7161683463","doi":"https://doi.org/10.48550/arxiv.2605.18328"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.18328","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.18328","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.18328","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5136456829","display_name":"Yuanjian He","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"He, Yuanjian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136462782","display_name":"Chen Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Chen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136503158","display_name":"Fasheng Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Fasheng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5136491340","display_name":"Jiangbo Cao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cao, Jiangbo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11019","display_name":"Image Enhancement Techniques","score":0.885699987411499,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11019","display_name":"Image Enhancement Techniques","score":0.885699987411499,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10481","display_name":"Computer Graphics and Visualization Techniques","score":0.06960000097751617,"subfield":{"id":"https://openalex.org/subfields/1704","display_name":"Computer Graphics and Computer-Aided Design"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.009600000455975533,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.6722999811172485},{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.4722000062465668},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4399999976158142},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.4212999939918518},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.3492000102996826},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.2761000096797943},{"id":"https://openalex.org/keywords/frame","display_name":"Frame (networking)","score":0.2741999924182892}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7437999844551086},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6832000017166138},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.6722999811172485},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6599000096321106},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.4722000062465668},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4399999976158142},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.4212999939918518},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.3492000102996826},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2761000096797943},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.2741999924182892},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.2727999985218048},{"id":"https://openalex.org/C3261483","wikidata":"https://www.wikidata.org/wiki/Q119565","display_name":"Frame rate","level":2,"score":0.2705000042915344},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.2581000030040741},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.2547000050544739},{"id":"https://openalex.org/C46686674","wikidata":"https://www.wikidata.org/wiki/Q466303","display_name":"Boosting (machine learning)","level":2,"score":0.2540999948978424},{"id":"https://openalex.org/C160633673","wikidata":"https://www.wikidata.org/wiki/Q355198","display_name":"Pixel","level":2,"score":0.25380000472068787}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.18328","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.18328","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.18328","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.18328","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"sustainable_development_goals":[{"score":0.7131059765815735,"display_name":"Decent work and economic growth","id":"https://metadata.un.org/sdg/8"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"LED":[0,6,148],"Virtual":[1],"Production":[2],"(VP)":[3],"uses":[4],"large":[5],"volumes":[7],"to":[8,61,78,88,101,114,211],"render":[9],"backgrounds":[10,186],"in":[11,110,205],"real":[12],"time,":[13],"enabling":[14],"in-camera":[15],"visual":[16],"effects":[17],"but":[18,207],"making":[19],"post-shot":[20],"changes":[21],"labor-intensive.":[22],"We":[23,120,135],"address":[24],"this":[25],"with":[26,47,58,117,124,180,191],"CineMatte,":[27],"a":[28,39,52,96,125,139,146],"robust":[29],"background":[30,46,69,89],"matting":[31,93,166],"framework":[32],"for":[33,164],"VP":[34,149,165,206],"and":[35,66,85,167,196],"beyond.":[36],"CineMatte":[37,50,201],"employs":[38,51],"cross-attention-conditioned":[40],"design.":[41],"Instead":[42],"of":[43,154],"concatenating":[44],"the":[45,48,63,67,75,80,118,133,152,157,161,174],"input,":[49],"Siamese,":[53],"frozen":[54],"DINOv3":[55],"Vision":[56],"Transformer":[57],"shared":[59],"weights":[60],"encode":[62],"input":[64],"frame":[65],"captured":[68,144],"separately.":[70],"A":[71],"cross-attention":[72],"module":[73],"compares":[74],"two":[76],"streams":[77],"predict":[79],"foreground,":[81],"preserving":[82],"pretrained":[83],"semantics":[84],"improving":[86],"robustness":[87],"shifts.":[90],"Previous":[91],"ViT-based":[92],"models":[94],"use":[95],"parallel":[97],"convolutional":[98],"\"detail":[99],"branch\"":[100],"recover":[102],"fine":[103],"details,":[104],"which":[105,130],"can":[106,187],"cause":[107],"boundary":[108],"artifacts":[109],"real-world":[111,212],"samples":[112],"due":[113],"semantic":[115],"misalignment":[116],"backbone.":[119],"instead":[121],"replace":[122],"it":[123],"pretrained,":[126],"image-guided":[127],"feature":[128],"upsampler,":[129],"largely":[131],"mitigates":[132],"problem.":[134],"also":[136,208],"introduce":[137],"CineMatte-4K,":[138],"4K":[140],"HDR":[141],"image-video":[142],"dataset":[143,163],"on":[145],"professional":[147],"stage.":[150],"To":[151],"best":[153],"our":[155],"knowledge,":[156],"image":[158],"subset":[159,176],"is":[160,168],"first":[162],"non-synthetic,":[169],"obtained":[170],"via":[171],"green-screen":[172],"insertion;":[173],"video":[175],"includes":[177],"camera":[178],"motion":[179],"tracked":[181],"trajectories":[182],"so":[183],"that":[184],"arbitrary":[185],"be":[188],"rendered":[189],"later":[190],"correct":[192],"parallax.":[193],"Across":[194],"CineMatte-4K":[195],"public":[197],"benchmarks":[198],"(VideoMatte240K,":[199],"YouTubeMatte),":[200],"not":[202],"only":[203],"excels":[204],"generalizes":[209],"robustly":[210],"footage.":[213]},"counts_by_year":[],"updated_date":"2026-07-01T08:55:40.977307","created_date":"2026-05-20T00:00:00"}
