{"id":"https://openalex.org/W7155046783","doi":"https://doi.org/10.48550/arxiv.2604.18037","title":"HABIT: Chrono-Synergia Robust Progressive Learning Framework for Composed Image Retrieval","display_name":"HABIT: Chrono-Synergia Robust Progressive Learning Framework for Composed Image Retrieval","publication_year":2026,"publication_date":"2026-04-20","ids":{"openalex":"https://openalex.org/W7155046783","doi":"https://doi.org/10.48550/arxiv.2604.18037"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.18037","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.18037","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.18037","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5134189417","display_name":"Zixu Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Zixu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134181244","display_name":"Yupeng Hu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hu, Yupeng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134196302","display_name":"Zhiwei 
Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Zhiwei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134160206","display_name":"Shiqi Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Shiqi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126005311","display_name":"Qinlei Huang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huang, Qinlei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134201651","display_name":"Zhiheng Fu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fu, Zhiheng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5134134786","display_name":"Yinwei Wei","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wei, Yinwei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.7763000130653381,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern 
Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.7763000130653381,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.05400000140070915,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.04190000146627426,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/image-retrieval","display_name":"Image retrieval","score":0.7113000154495239},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.6744999885559082},{"id":"https://openalex.org/keywords/content-based-image-retrieval","display_name":"Content-based image retrieval","score":0.4081999957561493},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.3930000066757202},{"id":"https://openalex.org/keywords/task","display_name":"Task (project 
management)","score":0.3790999948978424},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.37400001287460327},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.3668000102043152},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.35600000619888306}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8026999831199646},{"id":"https://openalex.org/C1667742","wikidata":"https://www.wikidata.org/wiki/Q10927554","display_name":"Image retrieval","level":3,"score":0.7113000154495239},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.6744999885559082},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6013000011444092},{"id":"https://openalex.org/C2780052074","wikidata":"https://www.wikidata.org/wiki/Q1128648","display_name":"Content-based image retrieval","level":4,"score":0.4081999957561493},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.40630000829696655},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4043999910354614},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.3930000066757202},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project 
management)","level":2,"score":0.3790999948978424},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.37400001287460327},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.3668000102043152},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.35600000619888306},{"id":"https://openalex.org/C152139883","wikidata":"https://www.wikidata.org/wiki/Q252973","display_name":"Mutual information","level":2,"score":0.35040000081062317},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3325999975204468},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.3075000047683716},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3028999865055084},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.2770000100135803},{"id":"https://openalex.org/C148483581","wikidata":"https://www.wikidata.org/wiki/Q446488","display_name":"Feature selection","level":2,"score":0.27619999647140503},{"id":"https://openalex.org/C189391414","wikidata":"https://www.wikidata.org/wiki/Q7936579","display_name":"Visual Word","level":4,"score":0.26429998874664307},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.26089999079704285},{"id":"https://openalex.org/C157657479","wikidata":"https://www.wikidata.org/wiki/Q2367247","display_name":"Closed 
captioning","level":3,"score":0.2581999897956848},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.257099986076355}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.18037","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.18037","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.18037","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.18037","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell 
University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Composed":[0],"Image":[1],"Retrieval":[2],"(CIR)":[3],"is":[4],"a":[5,20,25,46,105,166],"flexible":[6],"image":[7,18,27,113],"retrieval":[8,219],"paradigm":[9],"that":[10,152,205],"enables":[11],"users":[12],"to":[13,96,179],"accurately":[14],"locate":[15],"the":[16,54,65,84,92,123,133,140,144,155,160,170,192],"target":[17,145],"through":[19],"multimodal":[21],"query":[22],"composed":[23,88,112,141],"of":[24,87,118,136,194],"reference":[26],"and":[28,41,68,91,143,172,183,218],"modification":[29,97,157],"text.":[30],"Although":[31],"this":[32,77],"task":[33],"has":[34],"demonstrated":[35],"promising":[36],"applications":[37],"in":[38,49,71],"personalized":[39],"search":[40],"recommendation":[42],"systems,":[43],"it":[44],"encounters":[45],"severe":[47],"challenge":[48],"practical":[50],"scenarios":[51],"known":[52],"as":[53],"Noise":[55],"Triplet":[56],"Correspondence":[57],"(NTC)":[58],"problem.":[59],"This":[60],"issue":[61],"primarily":[62],"arises":[63],"from":[64],"high":[66],"cost":[67],"subjectivity":[69],"involved":[70],"annotating":[72],"triplet":[73],"data.":[74],"To":[75,99],"address":[76],"problem,":[78],"we":[79,103],"identify":[80],"two":[81,119,200],"central":[82],"challenges:":[83],"precise":[85],"estimation":[86],"semantic":[89],"discrepancy":[90],"insufficient":[93],"progressive":[94],"adaptation":[95],"discrepancy.":[98],"tackle":[100],"these":[101],"challenges,":[102],"propose":[104],"cHrono-synergiA":[106],"roBust":[107],"progressIve":[108],"learning":[109,190],"fr
amework":[110],"for":[111],"reTrieval":[114],"(HABIT),":[115],"which":[116],"consists":[117],"core":[120],"modules.":[121],"First,":[122],"Mutual":[124],"Knowledge":[125],"Estimation":[126],"Module":[127,164],"quantifies":[128],"sample":[129],"cleanliness":[130],"by":[131],"calculating":[132],"Transition":[134],"Rate":[135],"mutual":[137],"information":[138],"between":[139,169],"feature":[142],"image,":[146],"thereby":[147],"effectively":[148],"identifying":[149],"clean":[150],"samples":[151],"align":[153],"with":[154],"intended":[156],"semantics.":[158],"Second,":[159],"Dual-consistency":[161],"Progressive":[162],"Learning":[163],"introduces":[165],"collaborative":[167],"mechanism":[168],"historical":[171],"current":[173],"models,":[174],"simulating":[175],"human":[176],"habit":[177],"formation":[178],"retain":[180],"good":[181],"habits":[182],"calibrate":[184],"bad":[185],"habits,":[186],"ultimately":[187],"enabling":[188],"robust":[189],"under":[191,211],"presence":[193],"NTC.":[195],"Extensive":[196],"experiments":[197],"conducted":[198],"on":[199],"standard":[201],"CIR":[202],"datasets":[203],"demonstrate":[204],"HABIT":[206],"significantly":[207],"outperforms":[208],"most":[209],"methods":[210],"various":[212],"noise":[213],"ratios,":[214],"exhibiting":[215],"superior":[216],"robustness":[217],"performance.":[220],"Codes":[221],"are":[222],"available":[223],"at":[224],"https://github.com/Lee-zixu/HABIT":[225]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-22T00:00:00"}
