{"id":"https://openalex.org/W4403792307","doi":"https://doi.org/10.1145/3664647.3680879","title":"CartoonNet: Cartoon Parsing with Semantic Consistency and Structure Correlation","display_name":"CartoonNet: Cartoon Parsing with Semantic Consistency and Structure Correlation","publication_year":2024,"publication_date":"2024-10-26","ids":{"openalex":"https://openalex.org/W4403792307","doi":"https://doi.org/10.1145/3664647.3680879"},"language":"en","primary_location":{"id":"doi:10.1145/3664647.3680879","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3664647.3680879","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5045727713","display_name":"Jian-Jun Qiao","orcid":"https://orcid.org/0000-0003-4282-0149"},"institutions":[{"id":"https://openalex.org/I4800084","display_name":"Southwest Jiaotong University","ror":"https://ror.org/00hn7w693","country_code":"CN","type":"education","lineage":["https://openalex.org/I4800084"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jian-Jun Qiao","raw_affiliation_strings":["Southwest Jiaotong University, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"Southwest Jiaotong University, Chengdu, China","institution_ids":["https://openalex.org/I4800084"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101289085","display_name":"Mengyu Duan","orcid":"https://orcid.org/0009-0005-3230-9656"},"institutions":[{"id":"https://openalex.org/I4800084","display_name":"Southwest Jiaotong University","ror":"https://ror.org/00hn7w693","country_code":"CN","type":"education","lineage":["https://openalex.org/I4800084"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Meng-Yu Duan","raw_affiliation_strings":["Southwest Jiaotong University, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"Southwest Jiaotong University, Chengdu, China","institution_ids":["https://openalex.org/I4800084"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011680564","display_name":"Xiao Wu","orcid":"https://orcid.org/0000-0002-8322-8558"},"institutions":[{"id":"https://openalex.org/I4800084","display_name":"Southwest Jiaotong University","ror":"https://ror.org/00hn7w693","country_code":"CN","type":"education","lineage":["https://openalex.org/I4800084"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiao Wu","raw_affiliation_strings":["Southwest Jiaotong University, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"Southwest Jiaotong University, Chengdu, China","institution_ids":["https://openalex.org/I4800084"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5060458860","display_name":"Y. J. Song","orcid":"https://orcid.org/0009-0004-3500-0200"},"institutions":[{"id":"https://openalex.org/I4800084","display_name":"Southwest Jiaotong University","ror":"https://ror.org/00hn7w693","country_code":"CN","type":"education","lineage":["https://openalex.org/I4800084"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yu-Pei Song","raw_affiliation_strings":["Southwest Jiaotong University, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"Southwest Jiaotong University, Chengdu, China","institution_ids":["https://openalex.org/I4800084"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5045727713"],"corresponding_institution_ids":["https://openalex.org/I4800084"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.19275803,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"729","last_page":"737"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9922999739646912,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9922999739646912,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9775000214576721,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9678999781608582,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8031983375549316},{"id":"https://openalex.org/keywords/parsing","display_name":"Parsing","score":0.7917587757110596},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.7181782126426697},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6080377697944641},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5626547932624817},{"id":"https://openalex.org/keywords/correlation","display_name":"Correlation","score":0.5200228691101074},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.4528244435787201},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.12808451056480408}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8031983375549316},{"id":"https://openalex.org/C186644900","wikidata":"https://www.wikidata.org/wiki/Q194152","display_name":"Parsing","level":2,"score":0.7917587757110596},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.7181782126426697},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6080377697944641},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5626547932624817},{"id":"https://openalex.org/C117220453","wikidata":"https://www.wikidata.org/wiki/Q5172842","display_name":"Correlation","level":2,"score":0.5200228691101074},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4528244435787201},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.12808451056480408},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3664647.3680879","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3664647.3680879","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd ACM International Conference on Multimedia","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.5099999904632568,"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":13,"referenced_works":["https://openalex.org/W1901129140","https://openalex.org/W2412782625","https://openalex.org/W2598915960","https://openalex.org/W2799166040","https://openalex.org/W2894913190","https://openalex.org/W2963881378","https://openalex.org/W2964252655","https://openalex.org/W2981959899","https://openalex.org/W3014641072","https://openalex.org/W3040822117","https://openalex.org/W3096399932","https://openalex.org/W3115879670","https://openalex.org/W4312657985"],"related_works":["https://openalex.org/W579810227","https://openalex.org/W2142145894","https://openalex.org/W2952780262","https://openalex.org/W2979495269","https://openalex.org/W2392917763","https://openalex.org/W2358855848","https://openalex.org/W4381248170","https://openalex.org/W3189621521","https://openalex.org/W2173794830","https://openalex.org/W1502858101"],"abstract_inverted_index":{"Cartoon":[0],"parsing":[1,32,179,182,198],"is":[2,45,75,118,149],"an":[3],"important":[4],"task":[5],"for":[6,47,67,102,196],"cartoon-centric":[7],"applications,":[8],"which":[9,51,104,191],"segments":[10],"the":[11,19,61,79,96,108,113,130,138,160,185,188,193],"body":[12,126],"parts":[13,127],"of":[14,28,91,112,142,187],"cartoon":[15,29,31,48,68,84,143,170,178,197],"images.":[16],"Due":[17],"to":[18,59,77,99,106,120,129,168],"complex":[20,173],"appearances,":[21],"abstract":[22],"drawing":[23],"styles,":[24],"and":[25,54,64,94,133,155,180,199],"irregular":[26],"structures":[27],"characters,":[30],"remains":[33],"a":[34,40,145,156],"challenging":[35],"task.":[36],"In":[37],"this":[38],"paper,":[39],"novel":[41],"approach,":[42],"named":[43],"CartoonNet,":[44],"proposed":[46,161,189],"parsing,":[49],"in":[50],"semantic":[52,72,109],"consistency":[53,73,122],"structure":[55,146],"correlation":[56,147],"are":[57],"integrated":[58],"address":[60],"visual":[62],"diversity":[63],"structural":[65,140,164],"complexity":[66],"parsing.":[69,205],"A":[70,115],"memory-based":[71],"module":[74,148],"designed":[76],"learn":[78],"diverse":[80,92,125],"appearances":[81],"exhibited":[82],"by":[83],"characters.":[85],"The":[86],"memory":[87],"bank":[88],"stores":[89],"features":[90],"samples":[93,97,101,132],"retrieves":[95],"related":[98],"new":[100,134],"consistency,":[103],"aims":[105],"improve":[107],"reasoning":[110],"capability":[111],"network.":[114],"self-attention":[116],"mechanism":[117],"employed":[119],"conduct":[121],"learning":[123],"among":[124],"belong":[128],"retrieved":[131],"samples.":[135],"To":[136],"capture":[137],"intricate":[139],"information":[141],"images,":[144],"proposed.":[150],"Leveraging":[151],"graph":[152],"attention":[153],"networks":[154],"main":[157],"body-aware":[158],"mechanism,":[159],"approach":[162],"enables":[163],"correlation,":[165],"allowing":[166],"it":[167],"parse":[169],"images":[171],"with":[172],"structures.":[174],"Experiments":[175],"conducted":[176],"on":[177,203],"human":[181,204],"datasets":[183],"demonstrate":[184],"effectiveness":[186],"method,":[190],"outperforms":[192],"state-of-the-art":[194],"approaches":[195],"achieves":[200],"competitive":[201],"performance":[202]},"counts_by_year":[],"updated_date":"2025-12-19T19:40:27.379048","created_date":"2025-10-10T00:00:00"}
