{"id":"https://openalex.org/W4414871331","doi":"https://doi.org/10.1109/tcsvt.2025.3618279","title":"LoDisc: Learning Global-Local Discriminative Features for Self-Supervised Fine-Grained Visual Recognition","display_name":"LoDisc: Learning Global-Local Discriminative Features for Self-Supervised Fine-Grained Visual Recognition","publication_year":2025,"publication_date":"2025-10-06","ids":{"openalex":"https://openalex.org/W4414871331","doi":"https://doi.org/10.1109/tcsvt.2025.3618279"},"language":"en","primary_location":{"id":"doi:10.1109/tcsvt.2025.3618279","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2025.3618279","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113923514","display_name":"Jialu Shi","orcid":null},"institutions":[{"id":"https://openalex.org/I59028903","display_name":"Ocean University of China","ror":"https://ror.org/04rdtx186","country_code":"CN","type":"education","lineage":["https://openalex.org/I59028903"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jialu Shi","raw_affiliation_strings":["Faculty of Information Science and Engineering, Ocean University of China, Qingdao, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Information Science and Engineering, Ocean University of China, Qingdao, China","institution_ids":["https://openalex.org/I59028903"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079932099","display_name":"Zhiqiang Wei","orcid":"https://orcid.org/0000-0002-2830-8301"},"institutions":[{"id":"https://openalex.org/I59028903","display_name":"Ocean University of China","ror":"https://ror.org/04rdtx186","country_code":"CN","type":"education","lineage":["https://openalex.org/I59028903"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhiqiang Wei","raw_affiliation_strings":["Faculty of Information Science and Engineering, Ocean University of China, Qingdao, China"],"raw_orcid":"https://orcid.org/0000-0002-2830-8301","affiliations":[{"raw_affiliation_string":"Faculty of Information Science and Engineering, Ocean University of China, Qingdao, China","institution_ids":["https://openalex.org/I59028903"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058652390","display_name":"Jie Nie","orcid":"https://orcid.org/0000-0003-4952-7666"},"institutions":[{"id":"https://openalex.org/I59028903","display_name":"Ocean University of China","ror":"https://ror.org/04rdtx186","country_code":"CN","type":"education","lineage":["https://openalex.org/I59028903"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jie Nie","raw_affiliation_strings":["Faculty of Information Science and Engineering, Ocean University of China, Qingdao, China"],"raw_orcid":"https://orcid.org/0000-0003-4952-7666","affiliations":[{"raw_affiliation_string":"Faculty of Information Science and Engineering, Ocean University of China, Qingdao, China","institution_ids":["https://openalex.org/I59028903"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100784430","display_name":"Lei Huang","orcid":"https://orcid.org/0000-0003-4087-3677"},"institutions":[{"id":"https://openalex.org/I59028903","display_name":"Ocean University of China","ror":"https://ror.org/04rdtx186","country_code":"CN","type":"education","lineage":["https://openalex.org/I59028903"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lei Huang","raw_affiliation_strings":["Faculty of Information Science and Engineering, Ocean University of China, Qingdao, China"],"raw_orcid":"https://orcid.org/0000-0003-4087-3677","affiliations":[{"raw_affiliation_string":"Faculty of Information Science and Engineering, Ocean University of China, Qingdao, China","institution_ids":["https://openalex.org/I59028903"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.9349,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.79675977,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"36","issue":"3","first_page":"3679","last_page":"3692"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.6748999953269958,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.6748999953269958,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10057","display_name":"Face and Expression Recognition","score":0.6349999904632568,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12111","display_name":"Industrial Vision Systems and Defect Detection","score":0.6119999885559082,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.7364000082015991},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5924000144004822},{"id":"https://openalex.org/keywords/pretext","display_name":"Pretext","score":0.5738999843597412},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5551000237464905},{"id":"https://openalex.org/keywords/cognitive-neuroscience-of-visual-object-recognition","display_name":"Cognitive neuroscience of visual object recognition","score":0.5507000088691711},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.548799991607666},{"id":"https://openalex.org/keywords/feature-learning","display_name":"Feature learning","score":0.5457000136375427},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.5274999737739563},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5016999840736389}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7477999925613403},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.7364000082015991},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7264999747276306},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5924000144004822},{"id":"https://openalex.org/C2779627259","wikidata":"https://www.wikidata.org/wiki/Q779763","display_name":"Pretext","level":3,"score":0.5738999843597412},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5551000237464905},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.5507000088691711},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.548799991607666},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.5457000136375427},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.5274999737739563},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5016999840736389},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.4984000027179718},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.459199994802475},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.35519999265670776},{"id":"https://openalex.org/C2779321571","wikidata":"https://www.wikidata.org/wiki/Q7936605","display_name":"Visual learning","level":2,"score":0.353300005197525},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.35179999470710754},{"id":"https://openalex.org/C28006648","wikidata":"https://www.wikidata.org/wiki/Q6934509","display_name":"Multi-task learning","level":3,"score":0.3122999966144562},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.30889999866485596},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.3059999942779541},{"id":"https://openalex.org/C75294576","wikidata":"https://www.wikidata.org/wiki/Q5165192","display_name":"Contextual image classification","level":3,"score":0.29269999265670776},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.289000004529953},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.2734000086784363},{"id":"https://openalex.org/C2780586882","wikidata":"https://www.wikidata.org/wiki/Q7520643","display_name":"Simple (philosophy)","level":2,"score":0.26989999413490295},{"id":"https://openalex.org/C2776502983","wikidata":"https://www.wikidata.org/wiki/Q690182","display_name":"Contrast (vision)","level":2,"score":0.26750001311302185},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.2651999890804291},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.26339998841285706},{"id":"https://openalex.org/C94124525","wikidata":"https://www.wikidata.org/wiki/Q912550","display_name":"Categorization","level":2,"score":0.257099986076355}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcsvt.2025.3618279","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2025.3618279","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2061520909","display_name":null,"funder_award_id":"2019YFC1408405","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G2800808789","display_name":null,"funder_award_id":"ZR2023MF033","funder_id":"https://openalex.org/F4320324174","funder_display_name":"Natural Science Foundation of Shandong Province"},{"id":"https://openalex.org/G3261043767","display_name":null,"funder_award_id":"62472390","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8285579987","display_name":null,"funder_award_id":"No. 62472390","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320324174","display_name":"Natural Science Foundation of Shandong Province","ror":null},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":39,"referenced_works":["https://openalex.org/W1928906481","https://openalex.org/W2117539524","https://openalex.org/W2135706578","https://openalex.org/W2138011018","https://openalex.org/W2138621090","https://openalex.org/W2155904486","https://openalex.org/W2171590421","https://openalex.org/W2798991696","https://openalex.org/W2950768109","https://openalex.org/W2962858109","https://openalex.org/W3034865111","https://openalex.org/W3035524453","https://openalex.org/W3145450063","https://openalex.org/W3159481202","https://openalex.org/W3160314846","https://openalex.org/W3171007011","https://openalex.org/W3175156984","https://openalex.org/W3176276772","https://openalex.org/W3204826552","https://openalex.org/W3213639431","https://openalex.org/W4210551401","https://openalex.org/W4285605548","https://openalex.org/W4312295999","https://openalex.org/W4312734625","https://openalex.org/W4312823383","https://openalex.org/W4313056800","https://openalex.org/W4313156423","https://openalex.org/W4316660800","https://openalex.org/W4321021073","https://openalex.org/W4321780048","https://openalex.org/W4376464610","https://openalex.org/W4382239283","https://openalex.org/W4385245566","https://openalex.org/W4386057726","https://openalex.org/W4386065811","https://openalex.org/W4386076385","https://openalex.org/W4386076428","https://openalex.org/W4387682352","https://openalex.org/W4399728346"],"related_works":[],"abstract_inverted_index":{"The":[0,156],"self-supervised":[1,57,63,84],"contrastive":[2,19,58,66],"learning":[3,20,54,59,67],"strategy":[4],"has":[5],"attracted":[6],"considerable":[7],"attention":[8],"due":[9],"to":[10,22,80,148],"its":[11],"exceptional":[12],"ability":[13],"in":[14,115,152],"representation":[15],"learning.":[16],"However,":[17],"current":[18],"tends":[21],"learn":[23],"global":[24,56],"coarse-grained":[25,37],"representations":[26,129],"of":[27,130],"the":[28,83,106,121,126,143],"image":[29],"that":[30,105,120,142],"benefit":[31],"generic":[32],"object":[33,138,164],"recognition,":[34],"whereas":[35],"such":[36],"features":[38],"are":[39,92],"insufficient":[40],"for":[41,162],"fine-grained":[42,52,65,113,127,137],"visual":[43],"recognition.":[44],"In":[45],"this":[46],"paper,":[47],"we":[48],"incorporate":[49],"subtle":[50],"local":[51,75,88,117],"feature":[53,128],"into":[55],"through":[60],"a":[61,70,95,149],"pure":[62],"global-local":[64,122],"framework.":[68],"Specifically,":[69],"novel":[71],"pretext":[72,108],"task":[73,109],"called":[74],"discrimination":[76],"(LoDisc)":[77],"is":[78,159],"proposed":[79,144,157],"explicitly":[81],"supervise":[82],"model\u2019s":[85],"focus":[86],"toward":[87],"pivotal":[89],"regions,":[90],"which":[91],"captured":[93],"by":[94],"simple":[96],"but":[97],"effective":[98,161],"location-wise":[99],"mask":[100],"sampling":[101],"strategy.":[102],"We":[103],"show":[104],"LoDisc":[107],"can":[110,146],"effectively":[111],"enhance":[112],"clues":[114],"important":[116],"regions":[118],"and":[119],"framework":[123],"further":[124],"refines":[125],"images.":[131],"Extensive":[132],"experimental":[133],"results":[134],"on":[135],"different":[136,153],"recognition":[139,165],"tasks":[140],"demonstrate":[141],"method":[145,158],"lead":[147],"decent":[150],"improvement":[151],"evaluation":[154],"settings.":[155],"also":[160],"general":[163],"tasks.":[166]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
