{"id":"https://openalex.org/W4417073155","doi":"https://doi.org/10.1145/3743093.3771037","title":"SAFE-AKT: Kazakh Image-Text Retrieval via Semantic-Agnostic Feature Enhancement and Adaptive Knowledge Transfer","display_name":"SAFE-AKT: Kazakh Image-Text Retrieval via Semantic-Agnostic Feature Enhancement and Adaptive Knowledge Transfer","publication_year":2025,"publication_date":"2025-12-06","ids":{"openalex":"https://openalex.org/W4417073155","doi":"https://doi.org/10.1145/3743093.3771037"},"language":null,"primary_location":{"id":"doi:10.1145/3743093.3771037","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3743093.3771037","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3743093.3771037","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 7th ACM International Conference on Multimedia in Asia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3743093.3771037","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100424734","display_name":"Ping Hu","orcid":"https://orcid.org/0000-0003-1122-4395"},"institutions":[{"id":"https://openalex.org/I96908189","display_name":"Xinjiang University","ror":"https://ror.org/059gw8r13","country_code":"CN","type":"education","lineage":["https://openalex.org/I96908189"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Ping Hu","raw_affiliation_strings":["School of Computer Science and Technology, Xinjiang University, Urumqi, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Xinjiang University, Urumqi, China","institution_ids":["https://openalex.org/I96908189"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100635854","display_name":"Zhang Cao","orcid":"https://orcid.org/0009-0009-3767-9081"},"institutions":[{"id":"https://openalex.org/I96908189","display_name":"Xinjiang University","ror":"https://ror.org/059gw8r13","country_code":"CN","type":"education","lineage":["https://openalex.org/I96908189"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhiqun Cao","raw_affiliation_strings":["School of Computer Science and Technology, Xinjiang University, Urumqi, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Xinjiang University, Urumqi, China","institution_ids":["https://openalex.org/I96908189"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062833659","display_name":"Changle Yin","orcid":"https://orcid.org/0009-0002-7846-8597"},"institutions":[{"id":"https://openalex.org/I96908189","display_name":"Xinjiang University","ror":"https://ror.org/059gw8r13","country_code":"CN","type":"education","lineage":["https://openalex.org/I96908189"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Changle Yin","raw_affiliation_strings":["School of Computer Science and Technology, Xinjiang University, Urumqi, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Xinjiang University, Urumqi, China","institution_ids":["https://openalex.org/I96908189"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062079798","display_name":"Mingze Xu","orcid":"https://orcid.org/0009-0001-8931-5775"},"institutions":[{"id":"https://openalex.org/I16365422","display_name":"Hefei University of Technology","ror":"https://ror.org/02czkny70","country_code":"CN","type":"education","lineage":["https://openalex.org/I16365422"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Minqiang Xu","raw_affiliation_strings":["National Engineering Research Center of Speech and Language Information Processing, IFlytek, University of Science and Technology, Hefei, China"],"affiliations":[{"raw_affiliation_string":"National Engineering Research Center of Speech and Language Information Processing, IFlytek, University of Science and Technology, Hefei, China","institution_ids":["https://openalex.org/I16365422"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102248796","display_name":"Jingjing He","orcid":"https://orcid.org/0009-0004-4307-0778"},"institutions":[{"id":"https://openalex.org/I4210103115","display_name":"Xinjiang Institute of Ecology and Geography","ror":"https://ror.org/01a8ev928","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210103115"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jingjing He","raw_affiliation_strings":["The Document and Information Center, Xinjiang Institute of Ecology and Geography Chinese Academy of Science, Urumqi, China"],"affiliations":[{"raw_affiliation_string":"The Document and Information Center, Xinjiang Institute of Ecology and Geography Chinese Academy of Science, Urumqi, China","institution_ids":["https://openalex.org/I4210103115"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5027231197","display_name":"Lumei Zhou","orcid":"https://orcid.org/0000-0001-8031-9609"},"institutions":[{"id":"https://openalex.org/I96908189","display_name":"Xinjiang University","ror":"https://ror.org/059gw8r13","country_code":"CN","type":"education","lineage":["https://openalex.org/I96908189"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lumei Zhou","raw_affiliation_strings":["School of Computer Science and Technology, Xinjiang University, Urumqi, Xinjiang, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Xinjiang University, Urumqi, Xinjiang, China","institution_ids":["https://openalex.org/I96908189"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5100424734"],"corresponding_institution_ids":["https://openalex.org/I96908189"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.41105994,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.7958999872207642,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.7958999872207642,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.06650000065565109,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.03480000048875809,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/kazakh","display_name":"Kazakh","score":0.9812999963760376},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.5485000014305115},{"id":"https://openalex.org/keywords/overfitting","display_name":"Overfitting","score":0.5135999917984009},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.3508000075817108},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.311599999666214},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.2996000051498413},{"id":"https://openalex.org/keywords/feature-vector","display_name":"Feature vector","score":0.29739999771118164}],"concepts":[{"id":"https://openalex.org/C2781297163","wikidata":"https://www.wikidata.org/wiki/Q9252","display_name":"Kazakh","level":2,"score":0.9812999963760376},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7943000197410583},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5773000121116638},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.5485000014305115},{"id":"https://openalex.org/C22019652","wikidata":"https://www.wikidata.org/wiki/Q331309","display_name":"Overfitting","level":3,"score":0.5135999917984009},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3603000044822693},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.3508000075817108},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.33320000767707825},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.311599999666214},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.2996000051498413},{"id":"https://openalex.org/C83665646","wikidata":"https://www.wikidata.org/wiki/Q42139305","display_name":"Feature vector","level":2,"score":0.29739999771118164},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.29350000619888306},{"id":"https://openalex.org/C2779808786","wikidata":"https://www.wikidata.org/wiki/Q6664603","display_name":"Locality","level":2,"score":0.2786000072956085},{"id":"https://openalex.org/C203005215","wikidata":"https://www.wikidata.org/wiki/Q79798","display_name":"Machine translation","level":2,"score":0.27160000801086426},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.2696000039577484},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.2630000114440918},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.25699999928474426},{"id":"https://openalex.org/C150899416","wikidata":"https://www.wikidata.org/wiki/Q1820378","display_name":"Transfer of learning","level":2,"score":0.25290000438690186},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2522999942302704},{"id":"https://openalex.org/C89686163","wikidata":"https://www.wikidata.org/wiki/Q1187982","display_name":"Vector space model","level":2,"score":0.250900000333786}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3743093.3771037","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3743093.3771037","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3743093.3771037","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 7th ACM International Conference on Multimedia in Asia","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3743093.3771037","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3743093.3771037","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3743093.3771037","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 7th ACM International Conference on Multimedia in Asia","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320325419","display_name":"Xinjiang University","ror":"https://ror.org/059gw8r13"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4417073155.pdf","grobid_xml":"https://content.openalex.org/works/W4417073155.grobid-xml"},"referenced_works_count":37,"referenced_works":["https://openalex.org/W2946417913","https://openalex.org/W2948947170","https://openalex.org/W2963140444","https://openalex.org/W2963909453","https://openalex.org/W2964303116","https://openalex.org/W3035390927","https://openalex.org/W3096437212","https://openalex.org/W3105214104","https://openalex.org/W3156892778","https://openalex.org/W3174010726","https://openalex.org/W3177654849","https://openalex.org/W3213148312","https://openalex.org/W3213454282","https://openalex.org/W4224903957","https://openalex.org/W4283365658","https://openalex.org/W4284896388","https://openalex.org/W4293567540","https://openalex.org/W4312309807","https://openalex.org/W4375869474","https://openalex.org/W4385696946","https://openalex.org/W4386065462","https://openalex.org/W4386065512","https://openalex.org/W4386072392","https://openalex.org/W4387999284","https://openalex.org/W4389520022","https://openalex.org/W4389524249","https://openalex.org/W4391941146","https://openalex.org/W4393178573","https://openalex.org/W4403667998","https://openalex.org/W4403707460","https://openalex.org/W4407290098","https://openalex.org/W4408520851","https://openalex.org/W4409346697","https://openalex.org/W4409369175","https://openalex.org/W4410854502","https://openalex.org/W4411262363","https://openalex.org/W4412069965"],"related_works":[],"abstract_inverted_index":{"Kazakh":[0,24,38,66,91,111,144,155,164,170],"image-text":[1,67,139,156,171],"retrieval":[2,68],"is":[3],"a":[4,64],"challenging":[5],"task":[6],"with":[7,26],"no":[8],"dedicated":[9],"research":[10],"to":[11,33,86,109,142,150,159],"date.":[12],"Although":[13],"existing":[14,196],"multilingual":[15],"vision-language":[16],"pretraining":[17],"models":[18],"provide":[19],"limited":[20],"support":[21],"for":[22],"aligning":[23],"text":[25,102],"images,":[27],"their":[28],"performance":[29],"remains":[30],"poor":[31],"due":[32],"the":[34,41,100,106,120,123,128,143,161,168,184,187],"scarcity":[35,162],"of":[36,55,122,136,163],"annotated":[37],"resources":[39],"and":[40,75,96,126,178,186,199],"complex":[42],"expression":[43,94],"patterns":[44],"arising":[45],"from":[46,90],"its":[47],"agglutinative":[48],"linguistic":[49],"nature,":[50],"which":[51],"hinder":[52],"accurate":[53],"modeling":[54],"text-image":[56],"alignment.":[57,157],"To":[58],"address":[59,160],"these":[60],"challenges,":[61],"we":[62,166],"propose":[63],"new":[65,201],"framework":[69],"that":[70,191],"integrates":[71],"Semantic-Agnostic":[72],"Feature":[73],"Enhancement":[74],"Adaptive":[76],"Knowledge":[77],"Transfer":[78],"(SAFE-AKT).":[79],"SAFE":[80],"employs":[81],"an":[82],"adversarial":[83],"training":[84],"strategy":[85],"generate":[87],"semantic-agnostic":[88],"features":[89],"texts":[92],"(e.g.,":[93],"patterns)":[95],"incorporates":[97],"them":[98],"into":[99],"kazakh":[101],"encoding":[103],"process,":[104],"enhancing":[105],"model\u2019s":[107],"robustness":[108],"diverse":[110],"expressions.":[112],"AKT":[113],"estimates":[114],"sample-level":[115],"alignment":[116,140],"confidence":[117],"by":[118],"computing":[119],"entropy":[121],"teacher":[124],"distribution":[125],"weights":[127],"KL":[129],"divergence":[130],"loss":[131],"accordingly,":[132],"enabling":[133],"effective":[134],"transfer":[135],"high-quality":[137],"English":[138],"knowledge":[141],"representation":[145],"space":[146],"while":[147],"mitigating":[148],"overfitting":[149],"low-confidence":[151],"samples,":[152],"thereby":[153],"improving":[154],"Meanwhile,":[158],"data,":[165],"construct":[167],"first":[169],"dataset,":[172],"Flickr30k-kaz,":[173],"based":[174],"on":[175,183],"machine":[176],"translation":[177],"manual":[179],"refinement.":[180],"Experimental":[181],"results":[182],"Flickr30k-kaz":[185],"Multi30K":[188],"benchmark":[189],"demonstrate":[190],"our":[192],"method":[193],"significantly":[194],"outperforms":[195],"state-of-the-art":[197],"approaches":[198],"achieves":[200],"best":[202],"performance.":[203]},"counts_by_year":[],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-12-06T00:00:00"}
