{"id":"https://openalex.org/W4392902325","doi":"https://doi.org/10.1109/access.2024.3378095","title":"Interpolating the Text-to-Image Correspondence Based on Phonetic and Phonological Similarities for Nonword-to-Image Generation","display_name":"Interpolating the Text-to-Image Correspondence Based on Phonetic and Phonological Similarities for Nonword-to-Image Generation","publication_year":2024,"publication_date":"2024-01-01","ids":{"openalex":"https://openalex.org/W4392902325","doi":"https://doi.org/10.1109/access.2024.3378095"},"language":"en","primary_location":{"id":"doi:10.1109/access.2024.3378095","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2024.3378095","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/10473073.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/10473073.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5031528895","display_name":"Chihaya Matsuhira","orcid":"https://orcid.org/0000-0003-2453-4560"},"institutions":[{"id":"https://openalex.org/I60134161","display_name":"Nagoya University","ror":"https://ror.org/04chrp450","country_code":"JP","type":"education","lineage":["https://openalex.org/I60134161"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Chihaya Matsuhira","raw_affiliation_strings":["Graduate School of Informatics, Nagoya University, Nagoya, Aichi, Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Informatics, Nagoya University, Nagoya, Aichi, Japan","institution_ids":["https://openalex.org/I60134161"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102907439","display_name":"Marc A. Kastner","orcid":"https://orcid.org/0000-0002-9193-5973"},"institutions":[{"id":"https://openalex.org/I22299242","display_name":"Kyoto University","ror":"https://ror.org/02kpeqv85","country_code":"JP","type":"education","lineage":["https://openalex.org/I22299242"]},{"id":"https://openalex.org/I39012071","display_name":"Kyoto College of Graduate Studies for Informatics","ror":"https://ror.org/05mzj8a56","country_code":"JP","type":"education","lineage":["https://openalex.org/I39012071"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Marc A. Kastner","raw_affiliation_strings":["Graduate School of Informatics, Kyoto University, Kyoto, Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Informatics, Kyoto University, Kyoto, Japan","institution_ids":["https://openalex.org/I39012071","https://openalex.org/I22299242"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047823141","display_name":"Takahiro Komamizu","orcid":null},"institutions":[{"id":"https://openalex.org/I60134161","display_name":"Nagoya University","ror":"https://ror.org/04chrp450","country_code":"JP","type":"education","lineage":["https://openalex.org/I60134161"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Takahiro Komamizu","raw_affiliation_strings":["Mathematical and Data Science Center, Nagoya University, Nagoya, Aichi, Japan"],"affiliations":[{"raw_affiliation_string":"Mathematical and Data Science Center, Nagoya University, Nagoya, Aichi, Japan","institution_ids":["https://openalex.org/I60134161"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036735172","display_name":"Takatsugu Hirayama","orcid":"https://orcid.org/0000-0001-6290-9680"},"institutions":[{"id":"https://openalex.org/I60134161","display_name":"Nagoya University","ror":"https://ror.org/04chrp450","country_code":"JP","type":"education","lineage":["https://openalex.org/I60134161"]},{"id":"https://openalex.org/I84985371","display_name":"University of Human Environments","ror":"https://ror.org/029smmd76","country_code":"JP","type":"education","lineage":["https://openalex.org/I84985371"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Takatsugu Hirayama","raw_affiliation_strings":["Graduate School of Informatics, Nagoya University, Nagoya, Aichi, Japan","University of Human Environments, Okazaki, Aichi, Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Informatics, Nagoya University, Nagoya, Aichi, Japan","institution_ids":["https://openalex.org/I60134161"]},{"raw_affiliation_string":"University of Human Environments, Okazaki, Aichi, Japan","institution_ids":["https://openalex.org/I84985371"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058196829","display_name":"Keisuke Doman","orcid":null},"institutions":[{"id":"https://openalex.org/I60134161","display_name":"Nagoya University","ror":"https://ror.org/04chrp450","country_code":"JP","type":"education","lineage":["https://openalex.org/I60134161"]},{"id":"https://openalex.org/I98940699","display_name":"Chukyo University","ror":"https://ror.org/04ajrmg05","country_code":"JP","type":"education","lineage":["https://openalex.org/I98940699"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Keisuke Doman","raw_affiliation_strings":["Graduate School of Informatics, Nagoya University, Nagoya, Aichi, Japan","Chukyo University, Toyota, Aichi, Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Informatics, Nagoya University, Nagoya, Aichi, Japan","institution_ids":["https://openalex.org/I60134161"]},{"raw_affiliation_string":"Chukyo University, Toyota, Aichi, Japan","institution_ids":["https://openalex.org/I98940699"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027960360","display_name":"Yasutomo Kawanishi","orcid":"https://orcid.org/0000-0002-3799-4550"},"institutions":[{"id":"https://openalex.org/I4210110652","display_name":"RIKEN","ror":"https://ror.org/01sjwvz98","country_code":"JP","type":"facility","lineage":["https://openalex.org/I4210110652"]},{"id":"https://openalex.org/I46980622","display_name":"Kyoto Seika University","ror":"https://ror.org/05g4f0342","country_code":"JP","type":"education","lineage":["https://openalex.org/I46980622"]},{"id":"https://openalex.org/I60134161","display_name":"Nagoya University","ror":"https://ror.org/04chrp450","country_code":"JP","type":"education","lineage":["https://openalex.org/I60134161"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Yasutomo Kawanishi","raw_affiliation_strings":["Graduate School of Informatics, Nagoya University, Nagoya, Aichi, Japan","RIKEN, Seika, Kyoto, Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Informatics, Nagoya University, Nagoya, Aichi, Japan","institution_ids":["https://openalex.org/I60134161"]},{"raw_affiliation_string":"RIKEN, Seika, Kyoto, Japan","institution_ids":["https://openalex.org/I46980622","https://openalex.org/I4210110652"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5034941095","display_name":"Ichiro Ide","orcid":"https://orcid.org/0000-0003-3942-9296"},"institutions":[{"id":"https://openalex.org/I60134161","display_name":"Nagoya University","ror":"https://ror.org/04chrp450","country_code":"JP","type":"education","lineage":["https://openalex.org/I60134161"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Ichiro Ide","raw_affiliation_strings":["Graduate School of Informatics, Nagoya University, Nagoya, Aichi, Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Informatics, Nagoya University, Nagoya, Aichi, Japan","institution_ids":["https://openalex.org/I60134161"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5031528895"],"corresponding_institution_ids":["https://openalex.org/I60134161"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":1.7271,"has_fulltext":true,"cited_by_count":5,"citation_normalized_percentile":{"value":0.85842257,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"12","issue":null,"first_page":"41299","last_page":"41316"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6711106896400452},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.6050408482551575},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5969533920288086},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5210748910903931},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5193353891372681},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.3922022581100464},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.32784420251846313}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6711106896400452},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.6050408482551575},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5969533920288086},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5210748910903931},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5193353891372681},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.3922022581100464},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.32784420251846313},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2024.3378095","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2024.3378095","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/10473073.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:1ae819dd8f17465891e7e43da4164d71","is_oa":true,"landing_page_url":"https://doaj.org/article/1ae819dd8f17465891e7e43da4164d71","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 12, Pp 41299-41316 (2024)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2024.3378095","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2024.3378095","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/10473073.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2983449479","display_name":null,"funder_award_id":"Scientific Research","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G3459562248","display_name":null,"funder_award_id":"Grant","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G3631313543","display_name":null,"funder_award_id":"Fellowship","funder_id":"https://openalex.org/F4320308943","funder_display_name":"Microsoft Research"},{"id":"https://openalex.org/G4943039908","display_name":null,"funder_award_id":"22H03612","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G4954916424","display_name":null,"funder_award_id":"Fellowship","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G6879153672","display_name":null,"funder_award_id":"JPMJFS2120","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G8430481527","display_name":null,"funder_award_id":"Number","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"}],"funders":[{"id":"https://openalex.org/F4320308943","display_name":"Microsoft Research","ror":"https://ror.org/00d0nc645"},{"id":"https://openalex.org/F4320327550","display_name":"National Institute of Informatics","ror":"https://ror.org/04ksd4g47"},{"id":"https://openalex.org/F4320334764","display_name":"Japan Society for the Promotion of Science","ror":"https://ror.org/00hhkn466"},{"id":"https://openalex.org/F4320337013","display_name":"Information Technology Center, Nagoya University","ror":null}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4392902325.pdf","grobid_xml":"https://content.openalex.org/works/W4392902325.grobid-xml"},"referenced_works_count":49,"referenced_works":["https://openalex.org/W4941964","https://openalex.org/W46679369","https://openalex.org/W1861492603","https://openalex.org/W2061625509","https://openalex.org/W2099869405","https://openalex.org/W2137838732","https://openalex.org/W2183341477","https://openalex.org/W2316803017","https://openalex.org/W2781461271","https://openalex.org/W2791226589","https://openalex.org/W2886641317","https://openalex.org/W2962784628","https://openalex.org/W2973029704","https://openalex.org/W2978017171","https://openalex.org/W3110019360","https://openalex.org/W3118580076","https://openalex.org/W3118608800","https://openalex.org/W3129576130","https://openalex.org/W4224035735","https://openalex.org/W4243766748","https://openalex.org/W4281485151","https://openalex.org/W4284898017","https://openalex.org/W4285131243","https://openalex.org/W4285142052","https://openalex.org/W4299814950","https://openalex.org/W4302470888","https://openalex.org/W4312282373","https://openalex.org/W4312715377","https://openalex.org/W4312933868","https://openalex.org/W4321275178","https://openalex.org/W4323570466","https://openalex.org/W4385245566","https://openalex.org/W4385805112","https://openalex.org/W4387698264","https://openalex.org/W6600193324","https://openalex.org/W6601894380","https://openalex.org/W6631190155","https://openalex.org/W6679045638","https://openalex.org/W6747389005","https://openalex.org/W6755207826","https://openalex.org/W6765779288","https://openalex.org/W6768851824","https://openalex.org/W6790978476","https://openalex.org/W6791353385","https://openalex.org/W6809885388","https://openalex.org/W6810940779","https://openalex.org/W6838620345","https://openalex.org/W6838639034","https://openalex.org/W6850106008"],"related_works":["https://openalex.org/W405926467","https://openalex.org/W4402742086","https://openalex.org/W1965611333","https://openalex.org/W4404882811","https://openalex.org/W2032228042","https://openalex.org/W1505098369","https://openalex.org/W1999916109","https://openalex.org/W3132349679","https://openalex.org/W37840851","https://openalex.org/W4251713484"],"abstract_inverted_index":{"Text-to-Image":[0],"(T2I)":[1],"generation":[2,70,112,131,140,162],"is":[3,41],"the":[4,23,47,92,137,160,172],"task":[5],"of":[6,25,49,95,147],"synthesizing":[7],"images":[8,142],"corresponding":[9],"to":[10,43,108],"a":[11,59,110,121,168],"given":[12],"text":[13,50],"input.":[14],"The":[15,118],"recent":[16],"innovations":[17],"in":[18,46,66,84],"artificial":[19],"intelligence":[20],"have":[21,55],"enhanced":[22],"capacity":[24],"conventional":[26],"T2I":[27,111,130],"generation,":[28],"yielding":[29],"more":[30,32,151],"and":[31,87,101,105],"powerful":[33],"models":[34,80],"day":[35],"by":[36],"day.":[37],"However,":[38],"their":[39,99],"behavior":[40,62],"known":[42],"become":[44],"unstable":[45],"face":[48],"inputs":[51],"containing":[52],"nonwords":[53,97],"that":[54,136,143],"no":[56],"definition":[57],"within":[58],"language.":[60],"This":[61,89],"not":[63,72],"only":[64],"results":[65,163],"situations":[67],"where":[68],"image":[69,161],"does":[71],"match":[73,164],"human":[74,93,165],"expectations":[75],"but":[76],"also":[77,157],"hinders":[78],"these":[79],"from":[81],"being":[82],"utilized":[83],"psycholinguistic":[85],"applications":[86],"simulations.":[88],"paper":[90],"exploits":[91],"nature":[94],"associating":[96],"with":[98],"phonetically":[100,148],"phonologically":[102],"similar":[103,149],"words":[104,150],"uses":[106],"it":[107],"propose":[109],"framework":[113,119],"robust":[114],"against":[115],"nonword":[116],"inputs.":[117],"comprises":[120],"phonetics-aware":[122],"language":[123],"model":[124],"as":[125,127],"well":[126],"an":[128],"adjusted":[129],"model.":[132],"Our":[133],"evaluations":[134],"confirm":[135],"proposed":[138],"nonword-to-image":[139],"synthesizes":[141],"depict":[144],"visual":[145],"concepts":[146],"stably":[152],"than":[153,171],"comparative":[154],"methods.":[155],"We":[156],"assess":[158],"how":[159],"expectations,":[166],"showing":[167],"better":[169],"agreement":[170],"phonetics-blind":[173],"baseline.":[174]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":1}],"updated_date":"2026-04-02T15:55:50.835912","created_date":"2025-10-10T00:00:00"}
