{"id":"https://openalex.org/W4415190871","doi":"https://doi.org/10.1109/iccv51701.2025.00418","title":"TurboTrain: Towards Efficient and Balanced Multi-Task Learning for Multi-Agent Perception and Prediction","display_name":"TurboTrain: Towards Efficient and Balanced Multi-Task Learning for Multi-Agent Perception and Prediction","publication_year":2025,"publication_date":"2025-10-19","ids":{"openalex":"https://openalex.org/W4415190871","doi":"https://doi.org/10.1109/iccv51701.2025.00418"},"language":"en","primary_location":{"id":"doi:10.1109/iccv51701.2025.00418","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccv51701.2025.00418","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/CVF International Conference on Computer Vision (ICCV)","raw_type":"proceedings-article"},"type":"article","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2508.04682","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5025362732","display_name":"Zewei Zhou","orcid":"https://orcid.org/0000-0002-7378-9810"},"institutions":[{"id":"https://openalex.org/I161318765","display_name":"University of California, Los Angeles","ror":"https://ror.org/046rm7j60","country_code":"US","type":"education","lineage":["https://openalex.org/I161318765"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Zewei Zhou","raw_affiliation_strings":["University of California,Los Angeles"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of California,Los Angeles","institution_ids":["https://openalex.org/I161318765"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007649701","display_name":"Seth Z. Zhao","orcid":null},"institutions":[{"id":"https://openalex.org/I161318765","display_name":"University of California, Los Angeles","ror":"https://ror.org/046rm7j60","country_code":"US","type":"education","lineage":["https://openalex.org/I161318765"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Seth Z. Zhao","raw_affiliation_strings":["University of California,Los Angeles"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of California,Los Angeles","institution_ids":["https://openalex.org/I161318765"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086254443","display_name":"Tianhui Cai","orcid":null},"institutions":[{"id":"https://openalex.org/I161318765","display_name":"University of California, Los Angeles","ror":"https://ror.org/046rm7j60","country_code":"US","type":"education","lineage":["https://openalex.org/I161318765"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Tianhui Cai","raw_affiliation_strings":["University of California,Los Angeles"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of California,Los Angeles","institution_ids":["https://openalex.org/I161318765"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012295217","display_name":"Zhiyu Huang","orcid":"https://orcid.org/0000-0003-1592-7215"},"institutions":[{"id":"https://openalex.org/I161318765","display_name":"University of California, Los Angeles","ror":"https://ror.org/046rm7j60","country_code":"US","type":"education","lineage":["https://openalex.org/I161318765"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zhiyu Huang","raw_affiliation_strings":["University of California,Los Angeles"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of California,Los Angeles","institution_ids":["https://openalex.org/I161318765"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033444412","display_name":"Bolei Zhou","orcid":"https://orcid.org/0000-0003-4030-0684"},"institutions":[{"id":"https://openalex.org/I161318765","display_name":"University of California, Los Angeles","ror":"https://ror.org/046rm7j60","country_code":"US","type":"education","lineage":["https://openalex.org/I161318765"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Bolei Zhou","raw_affiliation_strings":["University of California,Los Angeles"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of California,Los Angeles","institution_ids":["https://openalex.org/I161318765"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101866439","display_name":"Jiaqi Ma","orcid":"https://orcid.org/0000-0001-8491-1968"},"institutions":[{"id":"https://openalex.org/I161318765","display_name":"University of California, Los Angeles","ror":"https://ror.org/046rm7j60","country_code":"US","type":"education","lineage":["https://openalex.org/I161318765"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jiaqi Ma","raw_affiliation_strings":["University of California,Los Angeles"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of California,Los Angeles","institution_ids":["https://openalex.org/I161318765"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5025362732"],"corresponding_institution_ids":["https://openalex.org/I161318765"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.14264426,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"4391","last_page":"4402"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9675999879837036,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9675999879837036,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9650999903678894,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9621999859809875,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.6295999884605408},{"id":"https://openalex.org/keywords/perception","display_name":"Perception","score":0.6237999796867371},{"id":"https://openalex.org/keywords/training","display_name":"Training (meteorology)","score":0.6110000014305115},{"id":"https://openalex.org/keywords/scheme","display_name":"Scheme (mathematics)","score":0.4796000123023987},{"id":"https://openalex.org/keywords/downstream","display_name":"Downstream (manufacturing)","score":0.31949999928474426}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7042999863624573},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.6295999884605408},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.6237999796867371},{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.6110000014305115},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5688999891281128},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.4796000123023987},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.46619999408721924},{"id":"https://openalex.org/C2776207758","wikidata":"https://www.wikidata.org/wiki/Q5303302","display_name":"Downstream (manufacturing)","level":2,"score":0.31949999928474426},{"id":"https://openalex.org/C136389625","wikidata":"https://www.wikidata.org/wiki/Q334384","display_name":"Supervised learning","level":3,"score":0.30399999022483826},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.29010000824928284},{"id":"https://openalex.org/C2778915421","wikidata":"https://www.wikidata.org/wiki/Q3643177","display_name":"Performance improvement","level":2,"score":0.2515999972820282}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/iccv51701.2025.00418","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccv51701.2025.00418","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/CVF International Conference on Computer Vision (ICCV)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2508.04682","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2508.04682","pdf_url":"https://arxiv.org/pdf/2508.04682","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2508.04682","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2508.04682","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2508.04682","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2508.04682","pdf_url":"https://arxiv.org/pdf/2508.04682","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"End-to-end":[0],"training":[1,13,35,71,85,89],"of":[2,112],"multi-agent":[3,38,48,114,127],"systems":[4],"offers":[5],"significant":[6],"advantages":[7],"in":[8],"improving":[9,92],"multi-task":[10,60,138],"performance.":[11,93],"However,":[12],"such":[14],"models":[15],"remains":[16],"challenging":[17],"and":[18,23,33,40,57,81,91,104,116,129,143],"requires":[19],"extensive":[20],"manual":[21],"design":[22],"monitoring.":[24],"In":[25],"this":[26],"work,":[27],"we":[28],"introduce":[29],"TurboTrain,":[30],"a":[31,47,58,98],"novel":[32],"efficient":[34],"framework":[36,74],"for":[37,78],"perception":[39,115],"prediction.":[41,144],"TurboTrain":[42,96],"comprises":[43],"two":[44],"key":[45],"components:":[46],"spatiotemporal":[49,126],"pretraining":[50,123],"scheme":[51],"based":[52,63],"on":[53,64,97],"masked":[54],"reconstruction":[55],"learning":[56,61,139],"balanced":[59,137],"strategy":[62,140],"gradient":[65],"conflict":[66],"suppression.":[67],"By":[68],"streamlining":[69],"the":[70,76,110,135],"process,":[72],"our":[73],"eliminates":[75],"need":[77],"manually":[79],"designing":[80],"tuning":[82],"complex":[83],"multi-stage":[84],"pipelines,":[86],"substantially":[87],"reducing":[88],"time":[90],"We":[94],"evaluate":[95],"real-world":[99],"cooperative":[100],"driving":[101],"dataset,":[102],"V2XPnP-Seq,":[103],"demonstrate":[105],"that":[106,122],"it":[107],"further":[108],"improves":[109],"performance":[111],"state-of-the-art":[113],"prediction":[117],"models.":[118],"Our":[119],"results":[120],"highlight":[121],"effectively":[124],"captures":[125],"features":[128],"significantly":[130],"benefits":[131],"downstream":[132],"tasks.":[133],"Moreover,":[134],"proposed":[136],"enhances":[141],"detection":[142]},"counts_by_year":[],"updated_date":"2026-05-06T06:03:25.996018","created_date":"2025-10-15T00:00:00"}
