{"id":"https://openalex.org/W4205865775","doi":"https://doi.org/10.1109/tip.2022.3141251","title":"Multi-Modal Convolutional Dictionary Learning","display_name":"Multi-Modal Convolutional Dictionary Learning","publication_year":2022,"publication_date":"2022-01-01","ids":{"openalex":"https://openalex.org/W4205865775","doi":"https://doi.org/10.1109/tip.2022.3141251","pmid":"https://pubmed.ncbi.nlm.nih.gov/35025741"},"language":"en","primary_location":{"id":"doi:10.1109/tip.2022.3141251","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tip.2022.3141251","pdf_url":null,"source":{"id":"https://openalex.org/S4210173141","display_name":"IEEE Transactions on Image Processing","issn_l":"1057-7149","issn":["1057-7149","1941-0042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Image Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Fangyuan Gao","orcid":"https://orcid.org/0000-0002-1225-2067"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Fangyuan Gao","raw_affiliation_strings":["School of Cyber Science and Technology, Beihang University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Cyber Science and Technology, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Xin Deng","orcid":"https://orcid.org/0000-0002-4708-6572"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xin Deng","raw_affiliation_strings":["School of Cyber Science and Technology, Beihang University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Cyber Science and Technology, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Mai Xu","orcid":"https://orcid.org/0000-0002-0277-3301"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mai Xu","raw_affiliation_strings":["Department of Electrical Information Engineering, Beihang University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Information Engineering, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Jingyi Xu","orcid":null},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jingyi Xu","raw_affiliation_strings":["Department of Electrical Information Engineering, Beihang University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Information Engineering, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"last","author":{"id":null,"display_name":"Pier Luigi Dragotti","orcid":"https://orcid.org/0000-0002-6073-2807"},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Pier Luigi Dragotti","raw_affiliation_strings":["Department of Electrical and Electronic Engineering, Imperial College London, London, U.K"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Electronic Engineering, Imperial College London, London, U.K","institution_ids":["https://openalex.org/I47508984"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I82880672"],"apc_list":null,"apc_paid":null,"fwci":6.4457,"has_fulltext":false,"cited_by_count":43,"citation_normalized_percentile":{"value":0.98198556,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":"31","issue":null,"first_page":"1325","last_page":"1339"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10500","display_name":"Sparse and Compressive Sensing Techniques","score":0.6172999739646912,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10500","display_name":"Sparse and Compressive Sensing Techniques","score":0.6172999739646912,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11659","display_name":"Advanced Image Fusion Techniques","score":0.27900001406669617,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11105","display_name":"Advanced Image Processing Techniques","score":0.011900000274181366,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.7132999897003174},{"id":"https://openalex.org/keywords/dictionary-learning","display_name":"Dictionary learning","score":0.6694999933242798},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.6603999733924866},{"id":"https://openalex.org/keywords/k-svd","display_name":"K-SVD","score":0.6157000064849854},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5663999915122986},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5157999992370605},{"id":"https://openalex.org/keywords/feature-learning","display_name":"Feature learning","score":0.49799999594688416},{"id":"https://openalex.org/keywords/convolutional-code","display_name":"Convolutional code","score":0.49309998750686646},{"id":"https://openalex.org/keywords/sparse-approximation","display_name":"Sparse approximation","score":0.4674000144004822}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7911999821662903},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7732999920845032},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.7132999897003174},{"id":"https://openalex.org/C2988886741","wikidata":"https://www.wikidata.org/wiki/Q25304494","display_name":"Dictionary learning","level":3,"score":0.6694999933242798},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.6603999733924866},{"id":"https://openalex.org/C154771677","wikidata":"https://www.wikidata.org/wiki/Q17098361","display_name":"K-SVD","level":3,"score":0.6157000064849854},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5663999915122986},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5157999992370605},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.49799999594688416},{"id":"https://openalex.org/C157899210","wikidata":"https://www.wikidata.org/wiki/Q1395022","display_name":"Convolutional code","level":3,"score":0.49309998750686646},{"id":"https://openalex.org/C124066611","wikidata":"https://www.wikidata.org/wiki/Q28684319","display_name":"Sparse approximation","level":2,"score":0.4674000144004822},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.429500013589859},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.4147000014781952},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.396699994802475},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.3833000063896179},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.3792000114917755},{"id":"https://openalex.org/C75294576","wikidata":"https://www.wikidata.org/wiki/Q5165192","display_name":"Contextual image classification","level":3,"score":0.35280001163482666},{"id":"https://openalex.org/C150899416","wikidata":"https://www.wikidata.org/wiki/Q1820378","display_name":"Transfer of learning","level":2,"score":0.3517000079154968},{"id":"https://openalex.org/C1667742","wikidata":"https://www.wikidata.org/wiki/Q10927554","display_name":"Image retrieval","level":3,"score":0.2962000072002411},{"id":"https://openalex.org/C104267543","wikidata":"https://www.wikidata.org/wiki/Q208163","display_name":"Signal processing","level":3,"score":0.29420000314712524},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.2703999876976013},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2696000039577484},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.2687999904155731},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.26010000705718994},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.258899986743927},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.25780001282691956}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tip.2022.3141251","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tip.2022.3141251","pdf_url":null,"source":{"id":"https://openalex.org/S4210173141","display_name":"IEEE Transactions on Image Processing","issn_l":"1057-7149","issn":["1057-7149","1941-0042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Image Processing","raw_type":"journal-article"},{"id":"pmid:35025741","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/35025741","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on image processing : a publication of the IEEE Signal Processing Society","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":55,"referenced_works":["https://openalex.org/W1897123318","https://openalex.org/W1948643287","https://openalex.org/W1964641132","https://openalex.org/W1973794531","https://openalex.org/W2000355138","https://openalex.org/W2005876975","https://openalex.org/W2014711337","https://openalex.org/W2040833130","https://openalex.org/W2056370875","https://openalex.org/W2069479606","https://openalex.org/W2078204800","https://openalex.org/W2099749431","https://openalex.org/W2115429828","https://openalex.org/W2117259536","https://openalex.org/W2120824855","https://openalex.org/W2121058967","https://openalex.org/W2127271355","https://openalex.org/W2133665775","https://openalex.org/W2134789674","https://openalex.org/W2139182243","https://openalex.org/W2146353910","https://openalex.org/W2153663612","https://openalex.org/W2160547390","https://openalex.org/W2164278908","https://openalex.org/W2190662802","https://openalex.org/W2194818953","https://openalex.org/W2202656999","https://openalex.org/W2209762097","https://openalex.org/W2219841864","https://openalex.org/W2294512729","https://openalex.org/W2344536484","https://openalex.org/W2492439964","https://openalex.org/W2532801510","https://openalex.org/W2581851997","https://openalex.org/W2596585942","https://openalex.org/W2612585477","https://openalex.org/W2613955579","https://openalex.org/W2760586727","https://openalex.org/W2773809991","https://openalex.org/W2798401637","https://openalex.org/W2803751491","https://openalex.org/W2811308087","https://openalex.org/W2820727372","https://openalex.org/W2902747464","https://openalex.org/W2912581987","https://openalex.org/W2924878362","https://openalex.org/W2963980268","https://openalex.org/W2998320011","https://openalex.org/W3013345642","https://openalex.org/W3014859219","https://openalex.org/W3035467948","https://openalex.org/W3046194589","https://openalex.org/W3049253011","https://openalex.org/W6724411756","https://openalex.org/W6764414574"],"related_works":[],"abstract_inverted_index":{"Convolutional":[0],"dictionary":[1,22,29,60,74,106,198,209,225],"learning":[2,30,61,75,210,226,230],"has":[3],"become":[4],"increasingly":[5],"popular":[6],"in":[7,103,177,190],"signal":[8],"and":[9,49,83,112,174,200,228],"image":[10,38,81,90,217],"processing":[11,39,218],"for":[12,108,116,133],"its":[13],"ability":[14],"to":[15,57,169],"overcome":[16],"the":[17,34,89,113,125,128,134,139,151,162,172,178,196,201,207],"limitations":[18],"of":[19,166,206],"traditional":[20],"patch-based":[21],"learning.":[23],"Although":[24],"most":[25],"studies":[26],"on":[27,33,161,214],"convolutional":[28,59,73,101,129,197],"mainly":[31],"focus":[32],"unimodal":[35],"case,":[36],"real-world":[37],"tasks":[40],"usually":[41],"involve":[42],"images":[43,147],"from":[44,150],"multiple":[45],"modalities,":[46,143],"e.g.,":[47],"visible":[48],"near-infrared":[50],"(NIR)":[51],"images.":[52],"Thus,":[53],"it":[54],"is":[55,97,107,115,122,212],"necessary":[56],"explore":[58],"across":[62,141],"different":[63,80,142],"modalities.":[64],"In":[65,92],"this":[66,93],"paper,":[67],"we":[68],"propose":[69,155],"a":[70,156],"novel":[71],"multi-modal":[72],"algorithm,":[76],"which":[77,104],"efficiently":[78],"correlates":[79],"modalities":[82],"fully":[84],"considers":[85],"neighborhood":[86],"information":[87],"at":[88],"level.":[91],"model,":[94],"each":[95],"modality":[96],"represented":[98],"by":[99,124],"two":[100],"dictionaries,":[102],"one":[105],"common":[109,135,173],"feature":[110,118],"representation":[111],"other":[114],"unique":[117,175],"representation.":[119],"The":[120,204],"model":[121,188],"constrained":[123],"requirement":[126],"that":[127,145,186],"sparse":[130],"representations":[131],"(CSRs)":[132],"features":[136],"should":[137],"be":[138],"same":[140,152],"considering":[144],"these":[146],"are":[148],"captured":[149],"scene.":[153],"We":[154,184],"new":[157],"training":[158,235],"method":[159,165],"based":[160,231],"alternating":[163],"direction":[164],"multipliers":[167],"(ADMM)":[168],"alternatively":[170],"learn":[171],"dictionaries":[176],"discrete":[179],"Fourier":[180],"transform":[181],"(DFT)":[182],"domain.":[183],"show":[185],"our":[187],"converges":[189],"less":[191],"than":[192,223],"20":[193],"iterations":[194],"between":[195],"updating":[199],"CSRs":[202],"calculation.":[203],"effectiveness":[205],"proposed":[208],"algorithm":[211],"demonstrated":[213],"various":[215],"multimodal":[216],"tasks,":[219],"achieves":[220],"better":[221],"performance":[222],"both":[224],"methods":[227,232],"deep":[229],"with":[233],"limited":[234],"data.":[236]},"counts_by_year":[{"year":2026,"cited_by_count":4},{"year":2025,"cited_by_count":13},{"year":2024,"cited_by_count":13},{"year":2023,"cited_by_count":11},{"year":2022,"cited_by_count":2}],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2022-01-25T00:00:00"}
