{"id":"https://openalex.org/W4416598150","doi":"https://doi.org/10.48550/arxiv.2511.17429","title":"Semantic and Semiotic Interplays in Text-to-Audio AI: Exploring Cognitive Dynamics and Musical Interactions","display_name":"Semantic and Semiotic Interplays in Text-to-Audio AI: Exploring Cognitive Dynamics and Musical Interactions","publication_year":2025,"publication_date":"2025-11-21","ids":{"openalex":"https://openalex.org/W4416598150","doi":"https://doi.org/10.48550/arxiv.2511.17429"},"language":null,"primary_location":{"id":"pmh:oai:arXiv.org:2511.17429","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2511.17429","pdf_url":"https://arxiv.org/pdf/2511.17429","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2511.17429","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5008918749","display_name":"Guilherme Palermo Coelho","orcid":"https://orcid.org/0000-0002-4641-0684"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Coelho, Guilherme","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5008918749"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10788","display_name":"Neuroscience and Music Perception","score":0.5497999787330627,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10788","display_name":"Neuroscience and Music Perception","score":0.5497999787330627,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11349","display_name":"Music Technology and Sound Studies","score":0.10419999808073044,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13380","display_name":"Sound Studies and Aurality","score":0.05620000138878822,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/semiotics","display_name":"Semiotics","score":0.6520000100135803},{"id":"https://openalex.org/keywords/musical","display_name":"Musical","score":0.6172999739646912},{"id":"https://openalex.org/keywords/schema","display_name":"Schema (genetic algorithms)","score":0.5121999979019165},{"id":"https://openalex.org/keywords/cognition","display_name":"Cognition","score":0.501800000667572},{"id":"https://openalex.org/keywords/constructive","display_name":"Constructive","score":0.45989999175071716},{"id":"https://openalex.org/keywords/transformative-learning","display_name":"Transformative learning","score":0.37779998779296875},{"id":"https://openalex.org/keywords/metacognition","display_name":"Metacognition","score":0.35359999537467957},{"id":"https://openalex.org/keywords/reflexivity","display_name":"Reflexivity","score":0.35010001063346863}],"concepts":[{"id":"https://openalex.org/C139997677","wikidata":"https://www.wikidata.org/wiki/Q60195","display_name":"Semiotics","level":2,"score":0.6520000100135803},{"id":"https://openalex.org/C558565934","wikidata":"https://www.wikidata.org/wiki/Q2743","display_name":"Musical","level":2,"score":0.6172999739646912},{"id":"https://openalex.org/C188147891","wikidata":"https://www.wikidata.org/wiki/Q147638","display_name":"Cognitive science","level":1,"score":0.5260999798774719},{"id":"https://openalex.org/C52146309","wikidata":"https://www.wikidata.org/wiki/Q7431116","display_name":"Schema (genetic algorithms)","level":2,"score":0.5121999979019165},{"id":"https://openalex.org/C169900460","wikidata":"https://www.wikidata.org/wiki/Q2200417","display_name":"Cognition","level":2,"score":0.501800000667572},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.46459999680519104},{"id":"https://openalex.org/C2778701210","wikidata":"https://www.wikidata.org/wiki/Q28130034","display_name":"Constructive","level":3,"score":0.45989999175071716},{"id":"https://openalex.org/C70587473","wikidata":"https://www.wikidata.org/wiki/Q7834111","display_name":"Transformative learning","level":2,"score":0.37779998779296875},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.36079999804496765},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.3540000021457672},{"id":"https://openalex.org/C118147538","wikidata":"https://www.wikidata.org/wiki/Q1126970","display_name":"Metacognition","level":3,"score":0.35359999537467957},{"id":"https://openalex.org/C13200473","wikidata":"https://www.wikidata.org/wiki/Q2747831","display_name":"Reflexivity","level":2,"score":0.35010001063346863},{"id":"https://openalex.org/C177291462","wikidata":"https://www.wikidata.org/wiki/Q423038","display_name":"Active listening","level":2,"score":0.34619998931884766},{"id":"https://openalex.org/C134141054","wikidata":"https://www.wikidata.org/wiki/Q965415","display_name":"Performative utterance","level":2,"score":0.3188000023365021},{"id":"https://openalex.org/C145912823","wikidata":"https://www.wikidata.org/wiki/Q113558","display_name":"Dynamics (music)","level":2,"score":0.3066999912261963},{"id":"https://openalex.org/C511192102","wikidata":"https://www.wikidata.org/wiki/Q5156948","display_name":"Comprehension","level":2,"score":0.30250000953674316},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.30090001225471497},{"id":"https://openalex.org/C146902061","wikidata":"https://www.wikidata.org/wiki/Q476590","display_name":"Music psychology","level":3,"score":0.28999999165534973},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.2766999900341034},{"id":"https://openalex.org/C207551092","wikidata":"https://www.wikidata.org/wiki/Q508969","display_name":"Cognitive linguistics","level":3,"score":0.27140000462532043},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.26989999413490295},{"id":"https://openalex.org/C2776538412","wikidata":"https://www.wikidata.org/wiki/Q989963","display_name":"Storytelling","level":3,"score":0.25859999656677246},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.2542000114917755}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2511.17429","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2511.17429","pdf_url":"https://arxiv.org/pdf/2511.17429","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2511.17429","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2511.17429","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2511.17429","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2511.17429","pdf_url":"https://arxiv.org/pdf/2511.17429","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"This":[0,153],"paper":[1,63,104,193],"investigates":[2],"the":[3,23,43,62,83,144,184,198,228],"emerging":[4],"text-to-audio":[5,44,107,201],"paradigm":[6],"in":[7,88,167,215],"artificial":[8],"intelligence":[9],"(AI),":[10],"examining":[11],"its":[12],"transformative":[13],"implications":[14],"for":[15],"musical":[16,70,114,159,190,216],"creation,":[17],"interpretation,":[18],"and":[19,26,49,60,73,96,100,118,128,150,171,183,209,218,230],"cognition.":[20,191],"I":[21],"explore":[22],"complex":[24],"semantic":[25],"semiotic":[27,181],"interplays":[28],"that":[29,106,187],"occur":[30],"when":[31],"descriptive":[32],"natural":[33],"language":[34],"prompts":[35,149,163],"are":[36],"translated":[37],"into":[38],"nuanced":[39,225],"sound":[40],"objects":[41],"across":[42],"modality.":[45],"Drawing":[46],"from":[47],"structuralist":[48],"post-structuralist":[50],"perspectives,":[51],"as":[52,54,111,132,206],"well":[53],"cognitive":[55,76,84,229],"theories":[56],"of":[57,82,93,113,126,169,178,200,227,233],"schema":[58,94],"dynamics":[59,85],"metacognition,":[61],"explores":[64,139],"how":[65,140],"these":[66,141],"AI":[67,108,202],"systems":[68],"reconfigure":[69],"signification":[71],"processes":[72,92],"navigate":[74,143],"established":[75],"frameworks.":[77],"The":[78,103,192],"research":[79],"analyzes":[80],"some":[81],"at":[86],"play":[87],"AI-mediated":[89],"musicking,":[90],"including":[91],"assimilation":[95],"accommodation,":[97],"metacognitive":[98],"reflection,":[99],"constructive":[101],"perception.":[102],"argues":[105],"models":[109,142,203],"function":[110],"quasi-objects":[112],"signification,":[115],"simultaneously":[116],"stabilizing":[117],"destabilizing":[119],"conventional":[120],"forms":[121,168],"while":[122],"fostering":[123],"new":[124],"modes":[125],"listening":[127],"aesthetic":[129],"reflexivity.Using":[130],"Udio":[131],"a":[133,175,212,223],"primary":[134],"case":[135],"study,":[136],"this":[137],"study":[138],"liminal":[145],"spaces":[146],"between":[147],"linguistic":[148],"sonic":[151],"outputs.":[152],"process":[154],"not":[155],"only":[156],"generates":[157],"novel":[158],"expressions":[160],"but":[161],"also":[162],"listeners":[164],"to":[165,204,221],"engage":[166],"critical":[170],"\"structurally-aware":[172],"listening.\",":[173],"encouraging":[174],"deeper":[176],"understanding":[177],"music's":[179],"structures,":[180],"nuances,":[182],"socio-cultural":[185],"contexts":[186],"shape":[188],"our":[189],"concludes":[194],"by":[195],"reflecting":[196],"on":[197],"potential":[199],"serve":[205],"epistemic":[207],"tools":[208],"quasi-objects,":[210],"facilitating":[211],"significant":[213],"shift":[214],"interactions":[217],"inviting":[219],"users":[220],"develop":[222],"more":[224],"comprehension":[226],"cultural":[231],"foundations":[232],"music.":[234]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-11-25T00:00:00"}
