{"id":"https://openalex.org/W7127064384","doi":"https://doi.org/10.1145/3787256.3787277","title":"Comparative Analysis of Sentence Transformers for Reference Paper Collection in Five Academic Fields","display_name":"Comparative Analysis of Sentence Transformers for Reference Paper Collection in Five Academic Fields","publication_year":2025,"publication_date":"2025-11-21","ids":{"openalex":"https://openalex.org/W7127064384","doi":"https://doi.org/10.1145/3787256.3787277"},"language":null,"primary_location":{"id":"doi:10.1145/3787256.3787277","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3787256.3787277","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 8th International Conference on Computational Intelligence and Intelligent Systems","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3787256.3787277","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5027897953","display_name":"Tresna Maulana Fahrudin","orcid":"https://orcid.org/0000-0002-9895-2442"},"institutions":[{"id":"https://openalex.org/I163770644","display_name":"Okayama University","ror":"https://ror.org/02pc6pc55","country_code":"JP","type":"education","lineage":["https://openalex.org/I163770644"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Tresna Maulana Fahrudin","raw_affiliation_strings":["Department of Information and Communication Systems, Okayama University, Okayama, Japan"],"raw_orcid":"https://orcid.org/0000-0002-9895-2442","affiliations":[{"raw_affiliation_string":"Department of Information and Communication Systems, Okayama University, Okayama, Japan","institution_ids":["https://openalex.org/I163770644"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124781784","display_name":"Nobuo Funabiki","orcid":null},"institutions":[{"id":"https://openalex.org/I163770644","display_name":"Okayama University","ror":"https://ror.org/02pc6pc55","country_code":"JP","type":"education","lineage":["https://openalex.org/I163770644"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Nobuo Funabiki","raw_affiliation_strings":["Department of Information and Communication Systems, Okayama University, Okayama, Japan"],"raw_orcid":"https://orcid.org/0000-0003-3234-3473","affiliations":[{"raw_affiliation_string":"Department of Information and Communication Systems, Okayama University, Okayama, Japan","institution_ids":["https://openalex.org/I163770644"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008159036","display_name":"Komang Candra Brata","orcid":"https://orcid.org/0000-0003-2896-6686"},"institutions":[{"id":"https://openalex.org/I163770644","display_name":"Okayama University","ror":"https://ror.org/02pc6pc55","country_code":"JP","type":"education","lineage":["https://openalex.org/I163770644"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Komang Candra Brata","raw_affiliation_strings":["Department of Information and Communication Systems, Okayama University, Okayama, Japan"],"raw_orcid":"https://orcid.org/0000-0003-2896-6686","affiliations":[{"raw_affiliation_string":"Department of Information and Communication Systems, Okayama University, Okayama, Japan","institution_ids":["https://openalex.org/I163770644"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046889564","display_name":"Noprianto Noprianto","orcid":"https://orcid.org/0000-0003-1046-3992"},"institutions":[{"id":"https://openalex.org/I163770644","display_name":"Okayama University","ror":"https://ror.org/02pc6pc55","country_code":"JP","type":"education","lineage":["https://openalex.org/I163770644"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Noprianto Noprianto","raw_affiliation_strings":["Department of Information and Communication Systems, Okayama University, Okayama, Japan"],"raw_orcid":"https://orcid.org/0000-0003-1046-3992","affiliations":[{"raw_affiliation_string":"Department of Information and Communication Systems, Okayama University, Okayama, Japan","institution_ids":["https://openalex.org/I163770644"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124813737","display_name":"Amri Muhaimin","orcid":null},"institutions":[{"id":"https://openalex.org/I3130997290","display_name":"University of Pembangunan Nasional Veteran Jawa Timur","ror":"https://ror.org/05sbm1c04","country_code":"ID","type":"education","lineage":["https://openalex.org/I3130997290"]}],"countries":["ID"],"is_corresponding":false,"raw_author_name":"Amri Muhaimin","raw_affiliation_strings":["Department of Data Science, Universitas Pembangunan Nasional Veteran Jawa Timur, Surabaya, Indonesia"],"raw_orcid":"https://orcid.org/0009-0004-4161-8277","affiliations":[{"raw_affiliation_string":"Department of Data Science, Universitas Pembangunan Nasional Veteran Jawa Timur, Surabaya, Indonesia","institution_ids":["https://openalex.org/I3130997290"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5124775919","display_name":"Kartika Maulida Hindrayani","orcid":null},"institutions":[{"id":"https://openalex.org/I3130997290","display_name":"University of Pembangunan Nasional Veteran Jawa Timur","ror":"https://ror.org/05sbm1c04","country_code":"ID","type":"education","lineage":["https://openalex.org/I3130997290"]}],"countries":["ID"],"is_corresponding":false,"raw_author_name":"Kartika Maulida Hindrayani","raw_affiliation_strings":["Department of Data Science, Universitas Pembangunan Nasional Veteran Jawa Timur, Surabaya, Indonesia"],"raw_orcid":"https://orcid.org/0009-0003-9755-0657","affiliations":[{"raw_affiliation_string":"Department of Data Science, Universitas Pembangunan Nasional Veteran Jawa Timur, Surabaya, Indonesia","institution_ids":["https://openalex.org/I3130997290"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5027897953"],"corresponding_institution_ids":["https://openalex.org/I163770644"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.81346549,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"139","last_page":"144"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10286","display_name":"Information Retrieval and Search Behavior","score":0.6417999863624573,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10286","display_name":"Information Retrieval and Search Behavior","score":0.6417999863624573,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.09769999980926514,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13274","display_name":"Expert finding and Q&A systems","score":0.041099999099969864,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/sentence","display_name":"Sentence","score":0.6884999871253967},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.6603999733924866},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.49219998717308044},{"id":"https://openalex.org/keywords/semantic-web","display_name":"Semantic Web","score":0.4253000020980835},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.4207000136375427},{"id":"https://openalex.org/keywords/data-collection","display_name":"Data collection","score":0.4036000072956085},{"id":"https://openalex.org/keywords/semantic-search","display_name":"Semantic search","score":0.3806999921798706},{"id":"https://openalex.org/keywords/pattern-matching","display_name":"Pattern matching","score":0.36000001430511475},{"id":"https://openalex.org/keywords/reference-model","display_name":"Reference model","score":0.34700000286102295}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7688000202178955},{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.6884999871253967},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.6603999733924866},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5978999733924866},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.49219998717308044},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.48420000076293945},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4456000030040741},{"id":"https://openalex.org/C2129575","wikidata":"https://www.wikidata.org/wiki/Q54837","display_name":"Semantic Web","level":2,"score":0.4253000020980835},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.4207000136375427},{"id":"https://openalex.org/C133462117","wikidata":"https://www.wikidata.org/wiki/Q4929239","display_name":"Data collection","level":2,"score":0.4036000072956085},{"id":"https://openalex.org/C166423231","wikidata":"https://www.wikidata.org/wiki/Q1891170","display_name":"Semantic search","level":3,"score":0.3806999921798706},{"id":"https://openalex.org/C68859911","wikidata":"https://www.wikidata.org/wiki/Q1503724","display_name":"Pattern matching","level":2,"score":0.36000001430511475},{"id":"https://openalex.org/C150189527","wikidata":"https://www.wikidata.org/wiki/Q356674","display_name":"Reference model","level":2,"score":0.34700000286102295},{"id":"https://openalex.org/C158154518","wikidata":"https://www.wikidata.org/wiki/Q7310970","display_name":"Relevance (law)","level":2,"score":0.3287000060081482},{"id":"https://openalex.org/C2777462759","wikidata":"https://www.wikidata.org/wiki/Q18395344","display_name":"Word embedding","level":3,"score":0.3264000117778778},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.32330000400543213},{"id":"https://openalex.org/C2778493491","wikidata":"https://www.wikidata.org/wiki/Q7449072","display_name":"Semantic matching","level":3,"score":0.3215000033378601},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.31700000166893005},{"id":"https://openalex.org/C130318100","wikidata":"https://www.wikidata.org/wiki/Q2268914","display_name":"Semantic similarity","level":2,"score":0.3027999997138977},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.2924000024795532},{"id":"https://openalex.org/C90312973","wikidata":"https://www.wikidata.org/wiki/Q7449052","display_name":"Semantic data model","level":2,"score":0.2912999987602234},{"id":"https://openalex.org/C44291984","wikidata":"https://www.wikidata.org/wiki/Q1074173","display_name":"Question answering","level":2,"score":0.2870999872684479},{"id":"https://openalex.org/C118643609","wikidata":"https://www.wikidata.org/wiki/Q189210","display_name":"Web application","level":2,"score":0.27959999442100525},{"id":"https://openalex.org/C7757238","wikidata":"https://www.wikidata.org/wiki/Q374040","display_name":"String searching algorithm","level":3,"score":0.26179999113082886},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.25929999351501465},{"id":"https://openalex.org/C58642233","wikidata":"https://www.wikidata.org/wiki/Q8269924","display_name":"Taxonomy (biology)","level":2,"score":0.2554999887943268},{"id":"https://openalex.org/C2777946921","wikidata":"https://www.wikidata.org/wiki/Q7449044","display_name":"Semantic analysis (machine learning)","level":2,"score":0.25060001015663147}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3787256.3787277","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3787256.3787277","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 8th International Conference on Computational Intelligence and Intelligent Systems","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3787256.3787277","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3787256.3787277","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 8th International Conference on Computational Intelligence and Intelligent Systems","raw_type":"proceedings-article"},"sustainable_development_goals":[{"score":0.6750365495681763,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":12,"referenced_works":["https://openalex.org/W2073728848","https://openalex.org/W2904769620","https://openalex.org/W2964523010","https://openalex.org/W3023758415","https://openalex.org/W3203912530","https://openalex.org/W4229045617","https://openalex.org/W4313523485","https://openalex.org/W4383678258","https://openalex.org/W4386730264","https://openalex.org/W4391133530","https://openalex.org/W4408408253","https://openalex.org/W4409888796"],"related_works":[],"abstract_inverted_index":{"Nowadays,":[0],"general-purpose":[1],"literature":[2],"search":[3],"engines":[4],"like":[5],"Google":[6],"Scholar":[7],"are":[8,56],"commonly":[9],"used":[10],"to":[11,63],"find":[12],"reference":[13,59,66,169],"papers":[14],"by":[15],"scholars.":[16],"Although":[17],"they":[18],"perform":[19,150],"well":[20,151],"in":[21,31,35,42,87,144,152,167,175,183],"a":[22,58,105],"particular":[23],"discipline,":[24],"users":[25],"may":[26],"face":[27],"difficulties":[28],"maintaining":[29],"relevance":[30],"others.":[32],"The":[33,137],"limitation":[34],"handling":[36],"queries":[37,90],"containing":[38],"domain-specific":[39,153],"vocabulary,":[40],"struggles":[41],"capturing":[43],"the":[44,49,156],"topic\u2019s":[45],"semantic":[46,73,161],"context,":[47],"and":[48,77,94,117,131,164],"matching":[50],"techniques":[51],"present":[52],"challenges.":[53],"Currently,":[54],"we":[55,103],"developing":[57],"paper":[60,170],"collection":[61,171],"system":[62],"accelerate":[64],"academic":[65,121,146,168],"searches":[67],"through":[68],"integrating":[69],"multiple":[70],"database":[71],"API,":[72],"sentence":[74,109],"embedding":[75,98],"models,":[76],"web":[78],"scraping":[79],"technology.":[80],"However,":[81],"our":[82,184],"prior":[83],"evaluations":[84],"were":[85,180],"limited":[86],"using":[88],"predefined":[89],"under":[91],"controlled":[92],"environments":[93],"relying":[95],"on":[96],"lightweight":[97],"models.":[99],"In":[100],"this":[101],"paper,":[102],"conduct":[104],"comparative":[106],"analysis":[107],"of":[108],"transformer":[110],"models":[111,142,179],"including":[112],"all-MiniLM-L6-v1,":[113],"all-DistilRoBERTa-v1,":[114],"all-mpnet-base-v2,":[115],"SciBERT,":[116],"SPECTER":[118],"across":[119,178],"five":[120],"fields":[122],"with":[123],"user-defined":[124],"queries.":[125],"We":[126],"adopt":[127],"precision@10,":[128],"NDCG@10,":[129],"accessibility@10,":[130],"response":[132],"time":[133,165],"for":[134],"evaluation":[135],"metrics.":[136],"results":[138],"show":[139],"that":[140],"some":[141],"excel":[143],"all":[145],"fields,":[147],"while":[148],"others":[149],"contexts,":[154],"highlighting":[155],"optimal":[157],"trade-off":[158],"between":[159],"relevance,":[160],"domain":[162],"understanding,":[163],"efficiency":[166],"systems.":[172],"Significant":[173],"differences":[174],"performance":[176],"metrics":[177],"confirmed":[181],"statistically":[182],"experiments.":[185]},"counts_by_year":[],"updated_date":"2026-02-06T02:01:19.302388","created_date":"2026-02-03T00:00:00"}
