{"id":"https://openalex.org/W4383503846","doi":"https://doi.org/10.1109/tcsvt.2023.3292995","title":"Multi-Task Learning With Multi-Query Transformer for Dense Prediction","display_name":"Multi-Task Learning With Multi-Query Transformer for Dense Prediction","publication_year":2023,"publication_date":"2023-07-07","ids":{"openalex":"https://openalex.org/W4383503846","doi":"https://doi.org/10.1109/tcsvt.2023.3292995"},"language":"en","primary_location":{"id":"doi:10.1109/tcsvt.2023.3292995","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2023.3292995","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5077429843","display_name":"Yangyang Xu","orcid":"https://orcid.org/0000-0002-7098-8419"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yangyang Xu","raw_affiliation_strings":["Institute of Artificial Intelligence, School of Computer Science, Wuhan University, Wuhan, China"],"raw_orcid":"https://orcid.org/0000-0002-7098-8419","affiliations":[{"raw_affiliation_string":"Institute of Artificial Intelligence, School of Computer Science, Wuhan University, Wuhan, China","institution_ids":["https://openalex.org/I37461747"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089900108","display_name":"Xiangtai Li","orcid":"https://orcid.org/0000-0002-0550-8247"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Xiangtai Li","raw_affiliation_strings":["S-Lab, Nanyang Technological University, Nanyang Ave, Singapore"],"raw_orcid":"https://orcid.org/0000-0002-0550-8247","affiliations":[{"raw_affiliation_string":"S-Lab, Nanyang Technological University, Nanyang Ave, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042527481","display_name":"Haobo Yuan","orcid":"https://orcid.org/0000-0001-9770-7720"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haobo Yuan","raw_affiliation_strings":["Institute of Artificial Intelligence, School of Computer Science, Wuhan University, Wuhan, China"],"raw_orcid":"https://orcid.org/0000-0001-9770-7720","affiliations":[{"raw_affiliation_string":"Institute of Artificial Intelligence, School of Computer Science, Wuhan University, Wuhan, China","institution_ids":["https://openalex.org/I37461747"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103072699","display_name":"Yibo Yang","orcid":"https://orcid.org/0000-0003-0530-7231"},"institutions":[{"id":"https://openalex.org/I4210103986","display_name":"Jingdong (China)","ror":"https://ror.org/01dkjkq64","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210103986"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yibo Yang","raw_affiliation_strings":["JD Explore Academy, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-0530-7231","affiliations":[{"raw_affiliation_string":"JD Explore Academy, Beijing, China","institution_ids":["https://openalex.org/I4210103986"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5024278302","display_name":"Lefei Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lefei Zhang","raw_affiliation_strings":["Institute of Artificial Intelligence, School of Computer Science, Wuhan University, Wuhan, China"],"raw_orcid":"https://orcid.org/0000-0003-0542-2280","affiliations":[{"raw_affiliation_string":"Institute of Artificial Intelligence, School of Computer Science, Wuhan University, Wuhan, China","institution_ids":["https://openalex.org/I37461747"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5077429843"],"corresponding_institution_ids":["https://openalex.org/I37461747"],"apc_list":null,"apc_paid":null,"fwci":10.9061,"has_fulltext":false,"cited_by_count":64,"citation_normalized_percentile":{"value":0.98829157,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":100},"biblio":{"volume":"34","issue":"2","first_page":"1228","last_page":"1240"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8586966395378113},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.5190468430519104},{"id":"https://openalex.org/keywords/query-optimization","display_name":"Query optimization","score":0.45628035068511963},{"id":"https://openalex.org/keywords/sargable","display_name":"Sargable","score":0.412738174200058},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.40540599822998047},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.30992329120635986},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.2588931918144226},{"id":"https://openalex.org/keywords/web-search-query","display_name":"Web search query","score":0.21556544303894043},{"id":"https://openalex.org/keywords/search-engine","display_name":"Search engine","score":0.17307376861572266}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8586966395378113},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.5190468430519104},{"id":"https://openalex.org/C157692150","wikidata":"https://www.wikidata.org/wiki/Q2919848","display_name":"Query optimization","level":2,"score":0.45628035068511963},{"id":"https://openalex.org/C192939062","wikidata":"https://www.wikidata.org/wiki/Q104840822","display_name":"Sargable","level":4,"score":0.412738174200058},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.40540599822998047},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.30992329120635986},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.2588931918144226},{"id":"https://openalex.org/C164120249","wikidata":"https://www.wikidata.org/wiki/Q995982","display_name":"Web search query","level":3,"score":0.21556544303894043},{"id":"https://openalex.org/C97854310","wikidata":"https://www.wikidata.org/wiki/Q19541","display_name":"Search engine","level":2,"score":0.17307376861572266},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcsvt.2023.3292995","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2023.3292995","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G7684016204","display_name":null,"funder_award_id":"62122060","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":74,"referenced_works":["https://openalex.org/W125693051","https://openalex.org/W2104408738","https://openalex.org/W2565639579","https://openalex.org/W2787091153","https://openalex.org/W2798441115","https://openalex.org/W2895250390","https://openalex.org/W2916798096","https://openalex.org/W2941769495","https://openalex.org/W2955639361","https://openalex.org/W2959581809","https://openalex.org/W2963430933","https://openalex.org/W2963677766","https://openalex.org/W2963877604","https://openalex.org/W2963881378","https://openalex.org/W2964247799","https://openalex.org/W2981801509","https://openalex.org/W2982152811","https://openalex.org/W2997473137","https://openalex.org/W3026081963","https://openalex.org/W3035276179","https://openalex.org/W3048093647","https://openalex.org/W3081167590","https://openalex.org/W3096609285","https://openalex.org/W3097571420","https://openalex.org/W3106901158","https://openalex.org/W3110440461","https://openalex.org/W3121523901","https://openalex.org/W3121709906","https://openalex.org/W3122412340","https://openalex.org/W3131500599","https://openalex.org/W3138516171","https://openalex.org/W3143320354","https://openalex.org/W3168984673","https://openalex.org/W3172863135","https://openalex.org/W3174280965","https://openalex.org/W3177645420","https://openalex.org/W3180150746","https://openalex.org/W3181286780","https://openalex.org/W3196107618","https://openalex.org/W3204397973","https://openalex.org/W3204786153","https://openalex.org/W3212386989","https://openalex.org/W3212972574","https://openalex.org/W4214520160","https://openalex.org/W4214524539","https://openalex.org/W4221152259","https://openalex.org/W4225493926","https://openalex.org/W4285104720","https://openalex.org/W4287685869","https://openalex.org/W4303645333","https://openalex.org/W4312257978","https://openalex.org/W4312391970","https://openalex.org/W4312433447","https://openalex.org/W4312444067","https://openalex.org/W4312511177","https://openalex.org/W4312598093","https://openalex.org/W4312612915","https://openalex.org/W4312695182","https://openalex.org/W4312796324","https://openalex.org/W4312844845","https://openalex.org/W4313023122","https://openalex.org/W4313166855","https://openalex.org/W4315705623","https://openalex.org/W4320015877","https://openalex.org/W6684360038","https://openalex.org/W6739901393","https://openalex.org/W6770205404","https://openalex.org/W6782322686","https://openalex.org/W6784094891","https://openalex.org/W6797235774","https://openalex.org/W6810835471","https://openalex.org/W6843355076","https://openalex.org/W6845518869","https://openalex.org/W6853042510"],"related_works":["https://openalex.org/W2006459955","https://openalex.org/W2955368753","https://openalex.org/W3125756434","https://openalex.org/W2184296057","https://openalex.org/W203907944","https://openalex.org/W4386051213","https://openalex.org/W2096359267","https://openalex.org/W2992414350","https://openalex.org/W1819934925","https://openalex.org/W185198413"],"abstract_inverted_index":{"Previous":[0],"multi-task":[1],"dense":[2,80,212],"prediction":[3,213],"studies":[4],"developed":[5],"complex":[6],"pipelines":[7],"such":[8],"as":[9],"multi-modal":[10],"distillations":[11],"in":[12],"multiple":[13,58,68,96,173],"stages":[14],"or":[15],"searching":[16],"for":[17,21],"task":[18,126],"relational":[19],"contexts":[20],"each":[22,37,99,125],"task.":[23,38],"The":[24,105],"core":[25],"insight":[26],"beyond":[27],"these":[28],"methods":[29],"is":[30,55,107,223],"to":[31,63,91,168,180,193],"maximize":[32],"the":[33,41,65,72,79,102,133,138,142,148,153,157,170,178,184,196,200,220],"mutual":[34],"effects":[35],"of":[36,77,109],"Inspired":[39],"by":[40,137],"recent":[42],"query-based":[43],"Transformers,":[44],"we":[45,86,161,188],"propose":[46],"a":[47,88,128,163,190],"simple":[48],"pipeline":[49],"named":[50],"Multi-Query":[51],"Transformer":[52],"(MQTransformer)":[53],"that":[54,219],"equipped":[56],"with":[57,127,199],"queries":[59,97],"from":[60,156,204],"different":[61,84,205],"tasks":[62,69],"facilitate":[64],"reasoning":[66,94],"among":[67,83,172],"and":[70,119,141,216,227,232],"simplify":[71],"cross-task":[73,93,115,164],"interaction":[74],"pipeline.":[75],"Instead":[76],"modeling":[78],"per-pixel":[81],"context":[82],"tasks,":[85],"seek":[87],"task-specific":[89,134,158],"proxy":[90],"perform":[92],"via":[95],"where":[98],"query":[100,116,144,155,165,202],"encodes":[101],"task-related":[103],"context.":[104],"MQTransformer":[106],"composed":[108],"three":[110],"key":[111],"components:":[112],"shared":[113,120,149,191],"encoder,":[114,150],"attention":[117,166],"module":[118,167,179],"decoder.":[121],"We":[122],"first":[123],"model":[124],"task-relevant":[129,143,154,174],"query.":[130],"Then":[131],"both":[132],"feature":[135,139],"output":[136],"extractor":[140],"are":[145,234],"fed":[146],"into":[147],"thus":[151],"encoding":[152],"feature.":[159],"Secondly,":[160],"design":[162],"reason":[169],"dependencies":[171],"queries;":[175],"this":[176],"enables":[177],"only":[181],"focus":[182],"on":[183,210],"query-level":[185],"interaction.":[186],"Finally,":[187],"use":[189],"decoder":[192],"gradually":[194],"refine":[195],"image":[197],"features":[198,203],"reasoned":[201],"tasks.":[206],"Extensive":[207],"experiment":[208],"results":[209],"two":[211],"datasets":[214],"(NYUD-v2":[215],"PASCAL-Context)":[217],"show":[218],"proposed":[221],"method":[222],"an":[224],"effective":[225],"approach":[226],"achieves":[228],"state-of-the-art":[229],"results.":[230],"Code":[231],"models":[233],"available":[235],"at":[236],"<uri":[237],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[238],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">https://github.com/yangyangxu0/MQTransformer</uri>":[239],".":[240]},"counts_by_year":[{"year":2026,"cited_by_count":6},{"year":2025,"cited_by_count":24},{"year":2024,"cited_by_count":27},{"year":2023,"cited_by_count":7}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
