{"id":"https://openalex.org/W4408062540","doi":"https://doi.org/10.5220/0013155300003890","title":"ABBIE: Attention-Based BI-Encoders for Predicting Where to Split Compound Sanskrit Words","display_name":"ABBIE: Attention-Based BI-Encoders for Predicting Where to Split Compound Sanskrit Words","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4408062540","doi":"https://doi.org/10.5220/0013155300003890"},"language":"en","primary_location":{"id":"doi:10.5220/0013155300003890","is_oa":true,"landing_page_url":"https://doi.org/10.5220/0013155300003890","pdf_url":null,"source":null,"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 17th International Conference on Agents and Artificial Intelligence","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.5220/0013155300003890","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101629306","display_name":"Irfan Ali","orcid":"https://orcid.org/0000-0002-3765-3107"},"institutions":[{"id":"https://openalex.org/I900890020","display_name":"University of Palermo","ror":"https://ror.org/044k9ta02","country_code":"IT","type":"education","lineage":["https://openalex.org/I900890020"]}],"countries":["IT"],"is_corresponding":true,"raw_author_name":"Irfan Ali","raw_affiliation_strings":["Department of Engineering, University of Palermo, Palermo, Italy"],"affiliations":[{"raw_affiliation_string":"Department of Engineering, University of Palermo, Palermo, Italy","institution_ids":["https://openalex.org/I900890020"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056795735","display_name":"Liliana Lo Presti","orcid":"https://orcid.org/0000-0003-0833-4403"},"institutions":[{"id":"https://openalex.org/I900890020","display_name":"University of Palermo","ror":"https://ror.org/044k9ta02","country_code":"IT","type":"education","lineage":["https://openalex.org/I900890020"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Liliana Lo Presti","raw_affiliation_strings":["Department of Engineering, University of Palermo, Palermo, Italy"],"affiliations":[{"raw_affiliation_string":"Department of Engineering, University of Palermo, Palermo, Italy","institution_ids":["https://openalex.org/I900890020"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5092915338","display_name":"Igor Span\u00f2","orcid":"https://orcid.org/0000-0003-0304-0764"},"institutions":[{"id":"https://openalex.org/I900890020","display_name":"University of Palermo","ror":"https://ror.org/044k9ta02","country_code":"IT","type":"education","lineage":["https://openalex.org/I900890020"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Igor Spano","raw_affiliation_strings":["Department of Cultures and Society, University of Palermo, Palermo, Italy"],"affiliations":[{"raw_affiliation_string":"Department of Cultures and Society, University of Palermo, Palermo, Italy","institution_ids":["https://openalex.org/I900890020"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5001373862","display_name":"Marco La Cascia","orcid":"https://orcid.org/0000-0002-8766-6395"},"institutions":[{"id":"https://openalex.org/I900890020","display_name":"University of Palermo","ror":"https://ror.org/044k9ta02","country_code":"IT","type":"education","lineage":["https://openalex.org/I900890020"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Marco La Cascia","raw_affiliation_strings":["Department of Engineering, University of Palermo, Palermo, Italy"],"affiliations":[{"raw_affiliation_string":"Department of Engineering, University of Palermo, Palermo, Italy","institution_ids":["https://openalex.org/I900890020"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5101629306"],"corresponding_institution_ids":["https://openalex.org/I900890020"],"apc_list":null,"apc_paid":null,"fwci":2.8599,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.89681223,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"334","last_page":"344"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.9365000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9236999750137329,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/sanskrit","display_name":"Sanskrit","score":0.8339062333106995},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.5697532892227173},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5335348844528198},{"id":"https://openalex.org/keywords/compound","display_name":"Compound","score":0.5048432946205139},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.45015352964401245},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4358515739440918},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.3456764817237854},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.2352047860622406},{"id":"https://openalex.org/keywords/philosophy","display_name":"Philosophy","score":0.1501188576221466},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.059281736612319946}],"concepts":[{"id":"https://openalex.org/C29912816","wikidata":"https://www.wikidata.org/wiki/Q11059","display_name":"Sanskrit","level":2,"score":0.8339062333106995},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.5697532892227173},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5335348844528198},{"id":"https://openalex.org/C2674912","wikidata":"https://www.wikidata.org/wiki/Q245423","display_name":"Compound","level":2,"score":0.5048432946205139},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.45015352964401245},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4358515739440918},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3456764817237854},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.2352047860622406},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.1501188576221466},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.059281736612319946}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.5220/0013155300003890","is_oa":true,"landing_page_url":"https://doi.org/10.5220/0013155300003890","pdf_url":null,"source":null,"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 17th International Conference on Agents and Artificial Intelligence","raw_type":"proceedings-article"},{"id":"pmh:oai:iris.unipa.it:10447/678963","is_oa":false,"landing_page_url":"https://hdl.handle.net/10447/678963","pdf_url":null,"source":{"id":"https://openalex.org/S4306401065","display_name":"Nova Science Publishers (Nova Science Publishers, Inc.)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/bookPart"}],"best_oa_location":{"id":"doi:10.5220/0013155300003890","is_oa":true,"landing_page_url":"https://doi.org/10.5220/0013155300003890","pdf_url":null,"source":null,"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 17th International Conference on Agents and Artificial Intelligence","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2802427415","https://openalex.org/W2620810496","https://openalex.org/W4210574062","https://openalex.org/W4206712636","https://openalex.org/W2064780833","https://openalex.org/W2315373242","https://openalex.org/W4382808597","https://openalex.org/W4385471946","https://openalex.org/W2068356829","https://openalex.org/W2357247495"],"abstract_inverted_index":{"Sanskrit":[0,17,80,186],"is":[1,18,38],"a":[2,35,49,59,69,130,135,175],"highly":[3],"composite":[4],"language,":[5],"morphologically":[6],"and":[7,68,92,114,188],"phonetically":[8],"complex.":[9],"One":[10],"of":[11,21,32,51,117,123,165,181,185,191],"the":[12,19,29,75,87,99,104,109,112,118,124,141,148,154,168,179,182,189],"major":[13],"challenges":[14],"in":[15,34,79,90,102,163],"processing":[16],"splitting":[20,105],"compound":[22,36,81,155],"words":[23],"that":[24,64,133,147],"are":[25,53,127],"merged":[26],"phonetically.":[27],"Recognizing":[28],"exact":[30],"location":[31,78],"splits":[33,43],"word":[37,156],"difficult":[39],"since":[40],"several":[41],"possible":[42],"can":[44],"be":[45,158],"found,":[46],"but":[47],"only":[48],"few":[50],"them":[52],"semantically":[54],"meaningful.":[55],"This":[56],"paper":[57,172],"proposes":[58,174],"novel":[60],"deep":[61],"learning":[62],"method":[63],"uses":[65],"two":[66,84],"bi-encoders":[67,85],"multi-head":[70],"attention":[71],"module":[72],"to":[73,139],"predict":[74],"valid":[76],"split":[77,159],"words.":[82],"The":[83,96,121,171],"process":[86],"input":[88],"sequence":[89],"direct":[91,113],"reverse":[93,115],"order":[94],"respectively.":[95],"model":[97,126,150],"learns":[98],"character-level":[100],"context":[101],"which":[103],"occurs":[106],"by":[107],"exploiting":[108],"correlation":[110],"between":[111],"dynamics":[116],"characters":[119],"sequence.":[120],"results":[122,145],"proposed":[125,149],"compared":[128],"with":[129],"stateof-the-art":[131],"technique":[132],"adopts":[134],"bidirectional":[136],"recurrent":[137],"network":[138],"solve":[140],"same":[142],"task.":[143],"Experimental":[144],"show":[146],"correctly":[151],"identifies":[152],"where":[153],"should":[157],"into":[160],"its":[161],"components":[162],"89.27%":[164],"cases,":[166],"outperforming":[167],"state-of-the-art":[169],"technique.":[170],"also":[173],"dataset":[176],"developed":[177],"from":[178],"repository":[180],"Digital":[183],"Corpus":[184],"(DCS)":[187],"University":[190],"Hyderabad":[192],"(UoH)":[193],"corpus.":[194]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-12-28T23:10:05.387466","created_date":"2025-10-10T00:00:00"}
