{"id":"https://openalex.org/W4292241799","doi":"https://doi.org/10.1007/s11263-022-01643-3","title":"Class-Difficulty Based Methods for Long-Tailed Visual Recognition","display_name":"Class-Difficulty Based Methods for Long-Tailed Visual Recognition","publication_year":2022,"publication_date":"2022-08-18","ids":{"openalex":"https://openalex.org/W4292241799","doi":"https://doi.org/10.1007/s11263-022-01643-3"},"language":"en","primary_location":{"id":"doi:10.1007/s11263-022-01643-3","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s11263-022-01643-3","pdf_url":"https://link.springer.com/content/pdf/10.1007/s11263-022-01643-3.pdf","source":{"id":"https://openalex.org/S25538012","display_name":"International Journal of Computer Vision","issn_l":"0920-5691","issn":["0920-5691","1573-1405"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Computer Vision","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s11263-022-01643-3.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5038264484","display_name":"Saptarshi Sinha","orcid":"https://orcid.org/0000-0002-5207-1551"},"institutions":[{"id":"https://openalex.org/I65143321","display_name":"Hitachi (Japan)","ror":"https://ror.org/02exqgm79","country_code":"JP","type":"company","lineage":["https://openalex.org/I65143321"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Saptarshi Sinha","raw_affiliation_strings":["Intelligent Vision Research Department, Hitachi Ltd., Kokubunji, 185-8601, Tokyo, Japan"],"raw_orcid":"https://orcid.org/0000-0002-5207-1551","affiliations":[{"raw_affiliation_string":"Intelligent Vision Research Department, Hitachi Ltd., Kokubunji, 185-8601, Tokyo, Japan","institution_ids":["https://openalex.org/I65143321"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112657316","display_name":"Hiroki Ohashi","orcid":null},"institutions":[{"id":"https://openalex.org/I65143321","display_name":"Hitachi (Japan)","ror":"https://ror.org/02exqgm79","country_code":"JP","type":"company","lineage":["https://openalex.org/I65143321"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Hiroki Ohashi","raw_affiliation_strings":["Intelligent Vision Research Department, Hitachi Ltd., Kokubunji, 185-8601, Tokyo, Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Intelligent Vision Research Department, Hitachi Ltd., Kokubunji, 185-8601, Tokyo, Japan","institution_ids":["https://openalex.org/I65143321"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5007900897","display_name":"Katsuyuki Nakamura","orcid":"https://orcid.org/0000-0002-8074-2279"},"institutions":[{"id":"https://openalex.org/I65143321","display_name":"Hitachi (Japan)","ror":"https://ror.org/02exqgm79","country_code":"JP","type":"company","lineage":["https://openalex.org/I65143321"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Katsuyuki Nakamura","raw_affiliation_strings":["R &D Group, Hitachi Ltd., Kokubunji, 185-8601, Tokyo, Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"R &D Group, Hitachi Ltd., Kokubunji, 185-8601, Tokyo, Japan","institution_ids":["https://openalex.org/I65143321"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5038264484"],"corresponding_institution_ids":["https://openalex.org/I65143321"],"apc_list":{"value":2890,"currency":"EUR","value_usd":3690},"apc_paid":{"value":2890,"currency":"EUR","value_usd":3690},"fwci":4.4408,"has_fulltext":true,"cited_by_count":36,"citation_normalized_percentile":{"value":0.95077584,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":"130","issue":"10","first_page":"2517","last_page":"2531"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.989799976348877,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7701916694641113},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.7063071727752686},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6766221523284912},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.6142452955245972},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.5450229644775391},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5021204948425293},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.4956752061843872},{"id":"https://openalex.org/keywords/sampling","display_name":"Sampling (signal processing)","score":0.4648856818675995},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.43624040484428406},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.12298053503036499}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7701916694641113},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.7063071727752686},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6766221523284912},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.6142452955245972},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.5450229644775391},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5021204948425293},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.4956752061843872},{"id":"https://openalex.org/C140779682","wikidata":"https://www.wikidata.org/wiki/Q210868","display_name":"Sampling (signal processing)","level":3,"score":0.4648856818675995},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.43624040484428406},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.12298053503036499},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/s11263-022-01643-3","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s11263-022-01643-3","pdf_url":"https://link.springer.com/content/pdf/10.1007/s11263-022-01643-3.pdf","source":{"id":"https://openalex.org/S25538012","display_name":"International Journal of Computer Vision","issn_l":"0920-5691","issn":["0920-5691","1573-1405"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Computer Vision","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1007/s11263-022-01643-3","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s11263-022-01643-3","pdf_url":"https://link.springer.com/content/pdf/10.1007/s11263-022-01643-3.pdf","source":{"id":"https://openalex.org/S25538012","display_name":"International Journal of Computer Vision","issn_l":"0920-5691","issn":["0920-5691","1573-1405"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Computer Vision","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.6000000238418579,"display_name":"Quality Education"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320309480","display_name":"Nvidia","ror":"https://ror.org/03jdj4y14"},{"id":"https://openalex.org/F4320311508","display_name":"National Institute of Advanced Industrial Science and Technology","ror":"https://ror.org/01703db54"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4292241799.pdf","grobid_xml":"https://content.openalex.org/works/W4292241799.grobid-xml"},"referenced_works_count":31,"referenced_works":["https://openalex.org/W2087240369","https://openalex.org/W2104167780","https://openalex.org/W2108598243","https://openalex.org/W2112796928","https://openalex.org/W2118978333","https://openalex.org/W2132791018","https://openalex.org/W2148143831","https://openalex.org/W2153579005","https://openalex.org/W2194775991","https://openalex.org/W2519882289","https://openalex.org/W2613718673","https://openalex.org/W2895299763","https://openalex.org/W2947380870","https://openalex.org/W2948672349","https://openalex.org/W2952120674","https://openalex.org/W2962933664","https://openalex.org/W2962934715","https://openalex.org/W2963026686","https://openalex.org/W2963212406","https://openalex.org/W2963351448","https://openalex.org/W2963691377","https://openalex.org/W2981188200","https://openalex.org/W2982540584","https://openalex.org/W3034933032","https://openalex.org/W3035054804","https://openalex.org/W3035552357","https://openalex.org/W3097255365","https://openalex.org/W3108105109","https://openalex.org/W4243367342","https://openalex.org/W6744066916","https://openalex.org/W6750523955"],"related_works":["https://openalex.org/W4379231730","https://openalex.org/W2737719445","https://openalex.org/W4389858081","https://openalex.org/W2391251536","https://openalex.org/W4324315429","https://openalex.org/W2501551404","https://openalex.org/W2465918047","https://openalex.org/W4385583601","https://openalex.org/W4366829857","https://openalex.org/W2362198218"],"abstract_inverted_index":{"Abstract":[0],"Long-tailed":[1],"datasets":[2,45,207],"are":[3,83],"very":[4],"frequently":[5],"encountered":[6],"in":[7,67],"real-world":[8,216],"use":[9,133,217],"cases":[10],"where":[11],"few":[12],"classes":[13,32,82,88],"or":[14,19,36,96],"categories":[15],"(known":[16,33],"as":[17,34,183,209],"majority":[18],"head":[20,51],"classes)":[21],"have":[22,56],"higher":[23],"number":[24],"of":[25,75,121,128,137,171],"data":[26,64,157],"samples":[27],"compared":[28],"to":[29,69,89,115,140],"the":[30,50,71,80,85,102,118,125,129,134,168],"other":[31],"minority":[35],"tail":[37,81],"classes).":[38],"Training":[39],"deep":[40],"neural":[41],"networks":[42],"on":[43,179,204],"such":[44,76,182,208],"gives":[46],"results":[47,203],"biased":[48],"towards":[49],"classes.":[52],"So":[53],"far,":[54],"researchers":[55],"come":[57],"up":[58],"with":[59],"multiple":[60,180],"weighted":[61,144,151],"loss":[62,145,197],"and":[63,91,154,190,198,212],"re-sampling":[65],"techniques":[66,77],"efforts":[68],"reduce":[70],"bias.":[72],"However,":[73],"most":[74,86],"assume":[78],"that":[79,101,195,214],"always":[84,106],"difficult":[87],"learn":[90],"therefore":[92],"need":[93],"more":[94],"weightage":[95],"attention.":[97],"Here,":[98],"we":[99,110,132,175],"argue":[100],"assumption":[103],"might":[104],"not":[105],"hold":[107],"true.":[108],"Therefore,":[109],"propose":[111],"a":[112,142,155],"novel":[113,143,156],"approach":[114],"dynamically":[116],"measure":[117],"instantaneous":[119],"difficulty":[120,135,149,162],"each":[122,138],"class":[123,139],"during":[124],"training":[126],"phase":[127],"model.":[130],"Further,":[131],"measures":[136],"design":[141],"technique":[146,159],"called":[147,160],"\u2018class-wise":[148,161],"based":[150,163],"(CDB-W)":[152],"loss\u2019":[153],"sampling":[158,164],"(CDB-S)\u2019.":[165],"To":[166],"verify":[167],"wide-scale":[169],"usability":[170],"our":[172],"CDB":[173],"methods,":[174],"conducted":[176],"extensive":[177],"experiments":[178],"tasks":[181],"image":[184],"classification,":[185],"object":[186],"detection,":[187],"instance":[188],"segmentation":[189],"video-action":[191],"classification.":[192],"Results":[193],"verified":[194],"CDB-W":[196],"CDB-S":[199],"could":[200],"achieve":[201],"state-of-the-art":[202],"many":[205],"class-imbalanced":[206],"ImageNet-LT,":[210],"LVIS":[211],"EGTEA,":[213],"resemble":[215],"cases.":[218]},"counts_by_year":[{"year":2026,"cited_by_count":4},{"year":2025,"cited_by_count":12},{"year":2024,"cited_by_count":8},{"year":2023,"cited_by_count":12}],"updated_date":"2026-06-19T15:47:20.252518","created_date":"2025-10-10T00:00:00"}
