{"id":"https://openalex.org/W4416057134","doi":"https://doi.org/10.48550/arxiv.2510.18799","title":"FeClustRE: Hierarchical Clustering and Semantic Tagging of App Features from User Reviews","display_name":"FeClustRE: Hierarchical Clustering and Semantic Tagging of App Features from User Reviews","publication_year":2025,"publication_date":"2025-10-21","ids":{"openalex":"https://openalex.org/W4416057134","doi":"https://doi.org/10.48550/arxiv.2510.18799"},"language":null,"primary_location":{"id":"pmh:oai:arXiv.org:2510.18799","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2510.18799","pdf_url":"https://arxiv.org/pdf/2510.18799","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2510.18799","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5119925020","display_name":"Max Tiessler","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Tiessler, Max","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5060562561","display_name":"Quim Motger","orcid":"https://orcid.org/0000-0002-4896-7515"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Motger, Quim","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5119925020"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10430","display_name":"Software Engineering Techniques and Practices","score":0.23929999768733978,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10430","display_name":"Software Engineering Techniques and Practices","score":0.23929999768733978,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14074","display_name":"Persona Design and Applications","score":0.15860000252723694,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11241","display_name":"Advanced Malware Detection Techniques","score":0.09529999643564224,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.595300018787384},{"id":"https://openalex.org/keywords/correctness","display_name":"Correctness","score":0.5899999737739563},{"id":"https://openalex.org/keywords/parsing","display_name":"Parsing","score":0.5569999814033508},{"id":"https://openalex.org/keywords/semantic-feature","display_name":"Semantic feature","score":0.5299999713897705},{"id":"https://openalex.org/keywords/taxonomy","display_name":"Taxonomy (biology)","score":0.5194000005722046},{"id":"https://openalex.org/keywords/bridging","display_name":"Bridging (networking)","score":0.4659000039100647},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4629000127315521},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.4438999891281128},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.4307999908924103}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8747000098228455},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.595300018787384},{"id":"https://openalex.org/C55439883","wikidata":"https://www.wikidata.org/wiki/Q360812","display_name":"Correctness","level":2,"score":0.5899999737739563},{"id":"https://openalex.org/C186644900","wikidata":"https://www.wikidata.org/wiki/Q194152","display_name":"Parsing","level":2,"score":0.5569999814033508},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5307000279426575},{"id":"https://openalex.org/C2781122975","wikidata":"https://www.wikidata.org/wiki/Q16928266","display_name":"Semantic feature","level":2,"score":0.5299999713897705},{"id":"https://openalex.org/C58642233","wikidata":"https://www.wikidata.org/wiki/Q8269924","display_name":"Taxonomy (biology)","level":2,"score":0.5194000005722046},{"id":"https://openalex.org/C174348530","wikidata":"https://www.wikidata.org/wiki/Q188635","display_name":"Bridging (networking)","level":2,"score":0.4659000039100647},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4629000127315521},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.4438999891281128},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.4307999908924103},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4291999936103821},{"id":"https://openalex.org/C2778827112","wikidata":"https://www.wikidata.org/wiki/Q22245680","display_name":"Feature engineering","level":3,"score":0.3993000090122223},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.38339999318122864},{"id":"https://openalex.org/C86034646","wikidata":"https://www.wikidata.org/wiki/Q474311","display_name":"Semantic gap","level":4,"score":0.3698999881744385},{"id":"https://openalex.org/C193125573","wikidata":"https://www.wikidata.org/wiki/Q7449065","display_name":"Semantic interpretation","level":2,"score":0.35690000653266907},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.35359999537467957},{"id":"https://openalex.org/C177937566","wikidata":"https://www.wikidata.org/wiki/Q4223102","display_name":"Document clustering","level":3,"score":0.3163999915122986},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.3151000142097473},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.314300000667572},{"id":"https://openalex.org/C92835128","wikidata":"https://www.wikidata.org/wiki/Q1277447","display_name":"Hierarchical clustering","level":3,"score":0.3140999972820282},{"id":"https://openalex.org/C500882744","wikidata":"https://www.wikidata.org/wiki/Q269236","display_name":"Latent Dirichlet allocation","level":3,"score":0.3091999888420105},{"id":"https://openalex.org/C100776233","wikidata":"https://www.wikidata.org/wiki/Q2532492","display_name":"Bridge (graph theory)","level":2,"score":0.2937000095844269},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2831999957561493},{"id":"https://openalex.org/C2777946921","wikidata":"https://www.wikidata.org/wiki/Q7449044","display_name":"Semantic analysis (machine learning)","level":2,"score":0.27469998598098755},{"id":"https://openalex.org/C195807954","wikidata":"https://www.wikidata.org/wiki/Q1662562","display_name":"Information extraction","level":2,"score":0.2727999985218048},{"id":"https://openalex.org/C90312973","wikidata":"https://www.wikidata.org/wiki/Q7449052","display_name":"Semantic data model","level":2,"score":0.26930001378059387},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2603999972343445}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2510.18799","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2510.18799","pdf_url":"https://arxiv.org/pdf/2510.18799","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2510.18799","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2510.18799","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2510.18799","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2510.18799","pdf_url":"https://arxiv.org/pdf/2510.18799","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"[Context":[0],"and":[1,65,93,118,133,148,164,177,189,192,200,208],"motivation.]":[2],"Extracting":[3],"features":[4,44,59,130],"from":[5],"mobile":[6],"app":[7,79,157],"reviews":[8,158],"is":[9],"increasingly":[10],"important":[11],"for":[12,145,159,174],"multiple":[13],"requirements":[14],"engineering":[15],"(RE)":[16],"tasks.":[17],"However,":[18],"existing":[19,53],"methods":[20,54],"struggle":[21],"to":[22,47],"turn":[23],"noisy,":[24],"ambiguous":[25],"feedback":[26,199],"into":[27,131,206],"interpretable":[28],"insights.":[29],"[Question/problem.]":[30],"Syntactic":[31],"approaches":[32,71],"lack":[33],"semantic":[34,61,120,162],"depth,":[35],"while":[36],"large":[37],"language":[38],"models":[39],"(LLMs)":[40],"often":[41],"miss":[42],"fine-grained":[43],"or":[45],"fail":[46],"structure":[48],"them":[49],"coherently.":[50],"In":[51,102],"addition,":[52],"output":[55],"flat":[56],"lists":[57],"of":[58,78,153],"without":[60],"organization,":[62],"limiting":[63],"interpretation":[64],"comparability.":[66],"Consequently,":[67],"current":[68,207],"feature":[69,112,175,201],"extraction":[70,146,176],"do":[72],"not":[73],"provide":[74],"structured,":[75],"meaningful":[76,136],"representations":[77],"features.":[80],"As":[81],"a":[82,108,150,171,185],"result,":[83],"practitioners":[84],"face":[85],"fragmented":[86],"information":[87],"that":[88],"hinder":[89],"requirement":[90],"analysis,":[91],"prioritization,":[92],"cross-app":[94],"comparison,":[95],"among":[96],"other":[97],"use":[98],"cases.":[99],"[Principal":[100],"ideas/results.]":[101],"this":[103],"context,":[104],"we":[105],"propose":[106],"FeClustRE,":[107],"framework":[109,173],"integrating":[110],"hybrid":[111,172],"extraction,":[113],"hierarchical":[114],"clustering":[115,160],"with":[116,126,184],"auto-tuning":[117,182],"LLM-based":[119],"labelling.":[121],"FeClustRE":[122,141,168],"combines":[123],"syntactic":[124],"parsing":[125],"LLM":[127],"enrichment,":[128],"organizes":[129],"clusters,":[132],"automatically":[134],"generates":[135],"taxonomy":[137,178],"labels.":[138],"We":[139],"evaluate":[140],"on":[142,149],"public":[143],"benchmarks":[144],"correctness":[147],"sample":[151],"study":[152],"generative":[154],"AI":[155],"assistant":[156],"quality,":[161],"coherence,":[163],"interpretability.":[165],"[Contribution.]":[166],"Overall,":[167],"delivers":[169],"(1)":[170],"generation,":[179],"(2)":[180],"an":[181],"mechanism":[183],"comprehensive":[186],"evaluation":[187],"methodology,":[188],"(3)":[190],"open-source":[191],"replicable":[193],"implementation.":[194],"These":[195],"contributions":[196],"bridge":[197],"user":[198],"understanding,":[202],"enabling":[203],"deeper":[204],"insights":[205],"emerging":[209],"requirements.":[210]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-24T00:00:00"}
