{"id":"https://openalex.org/W4313318649","doi":"https://doi.org/10.1109/tmm.2022.3233258","title":"Simultaneously Training and Compressing Vision-and-Language Pre-Training Model","display_name":"Simultaneously Training and Compressing Vision-and-Language Pre-Training Model","publication_year":2022,"publication_date":"2022-12-30","ids":{"openalex":"https://openalex.org/W4313318649","doi":"https://doi.org/10.1109/tmm.2022.3233258"},"language":"en","primary_location":{"id":"doi:10.1109/tmm.2022.3233258","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2022.3233258","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5091480702","display_name":"Qiaosong Qi","orcid":"https://orcid.org/0000-0002-9977-967X"},"institutions":[{"id":"https://openalex.org/I45928872","display_name":"Alibaba Group (China)","ror":"https://ror.org/00k642b80","country_code":"CN","type":"company","lineage":["https://openalex.org/I45928872"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qiaosong Qi","raw_affiliation_strings":["Alibaba Group, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Alibaba Group, Beijing, China","institution_ids":["https://openalex.org/I45928872"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049610245","display_name":"Aixi Zhang","orcid":"https://orcid.org/0000-0001-9863-0091"},"institutions":[{"id":"https://openalex.org/I45928872","display_name":"Alibaba Group (China)","ror":"https://ror.org/00k642b80","country_code":"CN","type":"company","lineage":["https://openalex.org/I45928872"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Aixi Zhang","raw_affiliation_strings":["Alibaba Group, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-9863-0091","affiliations":[{"raw_affiliation_string":"Alibaba Group, Beijing, China","institution_ids":["https://openalex.org/I45928872"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002061412","display_name":"Yue Liao","orcid":"https://orcid.org/0000-0002-2671-0655"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yue Liao","raw_affiliation_strings":["Institute of Artificial Intelligence, Beihang University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-2671-0655","affiliations":[{"raw_affiliation_string":"Institute of Artificial Intelligence, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100650059","display_name":"Wenyu Sun","orcid":"https://orcid.org/0000-0001-8478-7346"},"institutions":[{"id":"https://openalex.org/I45928872","display_name":"Alibaba Group (China)","ror":"https://ror.org/00k642b80","country_code":"CN","type":"company","lineage":["https://openalex.org/I45928872"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenyu Sun","raw_affiliation_strings":["Alibaba Group, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Alibaba Group, Beijing, China","institution_ids":["https://openalex.org/I45928872"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100431048","display_name":"Yongliang Wang","orcid":"https://orcid.org/0000-0001-7823-6345"},"institutions":[{"id":"https://openalex.org/I45928872","display_name":"Alibaba Group (China)","ror":"https://ror.org/00k642b80","country_code":"CN","type":"company","lineage":["https://openalex.org/I45928872"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yongliang Wang","raw_affiliation_strings":["Alibaba Group, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Alibaba Group, Beijing, China","institution_ids":["https://openalex.org/I45928872"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100318755","display_name":"Xiaobo Li","orcid":"https://orcid.org/0000-0002-8074-0230"},"institutions":[{"id":"https://openalex.org/I45928872","display_name":"Alibaba Group (China)","ror":"https://ror.org/00k642b80","country_code":"CN","type":"company","lineage":["https://openalex.org/I45928872"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaobo Li","raw_affiliation_strings":["Alibaba Group, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-8074-0230","affiliations":[{"raw_affiliation_string":"Alibaba Group, Beijing, China","institution_ids":["https://openalex.org/I45928872"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100330138","display_name":"Si Liu","orcid":"https://orcid.org/0000-0002-9180-2935"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Si Liu","raw_affiliation_strings":["Institute of Artificial Intelligence, Beihang University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-9180-2935","affiliations":[{"raw_affiliation_string":"Institute of Artificial Intelligence, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.4061,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.6115698,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":97,"max":98},"biblio":{"volume":"25","issue":null,"first_page":"8194","last_page":"8203"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9865000247955322,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9865000247955322,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9739000201225281,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9681000113487244,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6604500412940979},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.6227239370346069},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5677253007888794},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.4383730888366699},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.16677069664001465}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6604500412940979},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.6227239370346069},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5677253007888794},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.4383730888366699},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.16677069664001465}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tmm.2022.3233258","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2022.3233258","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G5696407354","display_name":null,"funder_award_id":"62122010","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7834498664","display_name":null,"funder_award_id":"61876177","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":71,"referenced_works":["https://openalex.org/W1821462560","https://openalex.org/W1889081078","https://openalex.org/W2277195237","https://openalex.org/W2425121537","https://openalex.org/W2739879705","https://openalex.org/W2896457183","https://openalex.org/W2912423076","https://openalex.org/W2921940552","https://openalex.org/W2926312400","https://openalex.org/W2946794439","https://openalex.org/W2948427397","https://openalex.org/W2952132648","https://openalex.org/W2969897437","https://openalex.org/W2970231061","https://openalex.org/W2970454332","https://openalex.org/W2975357369","https://openalex.org/W2978017171","https://openalex.org/W2978832950","https://openalex.org/W2981851019","https://openalex.org/W2984008963","https://openalex.org/W2987809065","https://openalex.org/W2987861506","https://openalex.org/W2990138076","https://openalex.org/W3005881764","https://openalex.org/W3030163527","https://openalex.org/W3034457371","https://openalex.org/W3035030897","https://openalex.org/W3090449556","https://openalex.org/W3101248447","https://openalex.org/W3105966348","https://openalex.org/W3106146634","https://openalex.org/W3122091215","https://openalex.org/W3139732141","https://openalex.org/W3157413304","https://openalex.org/W3158375352","https://openalex.org/W3164325351","https://openalex.org/W3168640669","https://openalex.org/W3173223111","https://openalex.org/W3175095612","https://openalex.org/W3176055902","https://openalex.org/W3190446228","https://openalex.org/W3204610735","https://openalex.org/W3205825741","https://openalex.org/W3205832214","https://openalex.org/W3206020652","https://openalex.org/W3207324131","https://openalex.org/W3208922547","https://openalex.org/W4288089799","https://openalex.org/W4394659899","https://openalex.org/W6637551013","https://openalex.org/W6638523607","https://openalex.org/W6639432524","https://openalex.org/W6730179637","https://openalex.org/W6739917289","https://openalex.org/W6751612189","https://openalex.org/W6755207826","https://openalex.org/W6762945437","https://openalex.org/W6763701032","https://openalex.org/W6766904570","https://openalex.org/W6767211374","https://openalex.org/W6767853649","https://openalex.org/W6768021236","https://openalex.org/W6768080748","https://openalex.org/W6768851824","https://openalex.org/W6768869542","https://openalex.org/W6769627184","https://openalex.org/W6770515439","https://openalex.org/W6773911639","https://openalex.org/W6775706467","https://openalex.org/W6790978476","https://openalex.org/W6864544085"],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W2382290278","https://openalex.org/W2350741829","https://openalex.org/W2530322880","https://openalex.org/W1596801655","https://openalex.org/W2359140296"],"abstract_inverted_index":{"Model":[0],"compression":[1,22,64,118,141,181,209],"is":[2,205],"an":[3,57,138,151],"essential":[4],"step":[5],"for":[6,73,211],"large-scale":[7],"pre-training":[8,201],"models":[9],"toward":[10],"practical":[11],"application":[12],"and":[13,44,55,59,76,96,122,133,189,203,228,230,240],"deployment":[14],"on":[15,219],"the":[16,52,124,130,144,159,169,185,206,231],"edge":[17],"device.":[18],"However,":[19],"when":[20],"conventional":[21,145],"methods":[23],"following":[24],"\u2018pre-training":[25],"then":[26],"compressing\u2019":[27],"two-phase":[28,53,146],"pipeline":[29,54],"are":[30],"applied":[31],"to":[32,40,120,128,157,182],"Vision-and-Language":[33],"Pre-training":[34],"(VLP)":[35],"models,":[36,222],"it":[37,204],"will":[38],"lead":[39],"a":[41,116,194,235],"high":[42],"calculation":[43,132],"memory":[45,134],"overhead.":[46],"In":[47],"this":[48],"work,":[49],"we":[50,114,149,174,192],"break":[51],"propose":[56,150],"efficient":[58],"effective":[60],"one-phase":[61,117,208],"VLP":[62,82,125,179,196,212,221],"model":[63,83,126,140,160,180,186,197],"mechanism,":[65],"named":[66],"<bold":[67,78,87,92,98,102],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[68,79,88,93,99,103,224],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">REDUCER</b>":[69],",":[70,226],"which":[71],"stands":[72],"\u2018simultaneously":[74],"training":[75],"comp":[77],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">RE</b>":[80],"ssing\u2019":[81],"via":[84],"progressive":[85,153],"mo":[86],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">DU</b>":[89],"le":[90],"repla":[91],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">C</b>":[94],"ing":[95],"n":[97],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">E</b>":[100],"twork":[101],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">R</b>":[104],"ewiring.":[105],"Specifically,":[106],"REDUCER":[107],"consists":[108],"of":[109],"three":[110],"insightful":[111],"designs.":[112],"Firstly,":[113],"design":[115],"framework":[119],"train":[121],"compress":[123,158,184],"simultaneously":[127,183],"avoid":[129],"extra":[131],"cost":[135],"caused":[136],"by":[137],"isolated":[139],"phase":[142],"in":[143,187],"pipeline.":[147],"Secondly,":[148],"adaptive":[152],"module":[154],"replacing":[155],"mechanism":[156],"depth":[161],"free":[162],"from":[163],"explicit":[164],"knowledge":[165],"distillation":[166],"losses,":[167],"relieving":[168],"multi-task":[170],"optimization":[171],"problems.":[172],"Thirdly,":[173],"integrate":[175],"pruning":[176],"techniques":[177],"into":[178],"width":[188],"depth.":[190],"Overall,":[191],"obtain":[193],"lightweight":[195],"with":[198],"only":[199],"one":[200],"phase,":[202],"first":[207],"method":[210],"models.":[213],"Extensive":[214],"experiments":[215],"have":[216],"been":[217],"conducted":[218],"representative":[220],"<italic":[223],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">i.e.</i>":[225],"ClipBERT":[227],"VICTOR,":[229],"experimental":[232],"results":[233],"show":[234],"superior":[236],"trade-off":[237],"between":[238],"performance":[239],"efficiency.":[241]},"counts_by_year":[{"year":2025,"cited_by_count":4}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
