{"id":"https://openalex.org/W4379519265","doi":"https://doi.org/10.1017/s1351324923000165","title":"Focusing on potential named entities during active label acquisition","display_name":"Focusing on potential named entities during active label acquisition","publication_year":2023,"publication_date":"2023-06-06","ids":{"openalex":"https://openalex.org/W4379519265","doi":"https://doi.org/10.1017/s1351324923000165"},"language":"en","primary_location":{"id":"doi:10.1017/s1351324923000165","is_oa":true,"landing_page_url":"https://doi.org/10.1017/s1351324923000165","pdf_url":"https://www.cambridge.org/core/services/aop-cambridge-core/content/view/087DF41DC645A49AA712D55D486405DD/S1351324923000165a.pdf/div-class-title-focusing-on-potential-named-entities-during-active-label-acquisition-div.pdf","source":{"id":"https://openalex.org/S18088403","display_name":"Natural Language Engineering","issn_l":"1351-3249","issn":["1351-3249","1469-8110"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311721","host_organization_name":"Cambridge University Press","host_organization_lineage":["https://openalex.org/P4310311721","https://openalex.org/P4310311702"],"host_organization_lineage_names":["Cambridge University Press","University of Cambridge"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Natural Language Engineering","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://www.cambridge.org/core/services/aop-cambridge-core/content/view/087DF41DC645A49AA712D55D486405DD/S1351324923000165a.pdf/div-class-title-focusing-on-potential-named-entities-during-active-label-acquisition-div.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5071697234","display_name":"Ali Osman Berk \u015eapc\u0131","orcid":"https://orcid.org/0000-0003-4396-817X"},"institutions":[{"id":"https://openalex.org/I134235054","display_name":"Sabanc\u0131 \u00dcniversitesi","ror":"https://ror.org/049asqa32","country_code":"TR","type":"education","lineage":["https://openalex.org/I134235054"]}],"countries":["TR"],"is_corresponding":false,"raw_author_name":"Ali Osman Berk \u015eapc\u0131","raw_affiliation_strings":["Faculty of Engineering and Natural Sciences, Sabanc\u0131 University, Istanbul, Turkey"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Engineering and Natural Sciences, Sabanc\u0131 University, Istanbul, Turkey","institution_ids":["https://openalex.org/I134235054"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5092098096","display_name":"Hasan Kemik","orcid":null},"institutions":[{"id":"https://openalex.org/I134235054","display_name":"Sabanc\u0131 \u00dcniversitesi","ror":"https://ror.org/049asqa32","country_code":"TR","type":"education","lineage":["https://openalex.org/I134235054"]}],"countries":["TR"],"is_corresponding":false,"raw_author_name":"Hasan Kemik","raw_affiliation_strings":["Faculty of Engineering and Natural Sciences, Sabanc\u0131 University, Istanbul, Turkey"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Engineering and Natural Sciences, Sabanc\u0131 University, Istanbul, Turkey","institution_ids":["https://openalex.org/I134235054"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035084467","display_name":"Reyyan Yeniterzi","orcid":"https://orcid.org/0000-0002-8501-6209"},"institutions":[{"id":"https://openalex.org/I134235054","display_name":"Sabanc\u0131 \u00dcniversitesi","ror":"https://ror.org/049asqa32","country_code":"TR","type":"education","lineage":["https://openalex.org/I134235054"]}],"countries":["TR"],"is_corresponding":true,"raw_author_name":"Reyyan Yeniterzi","raw_affiliation_strings":["Faculty of Engineering and Natural Sciences, Sabanc\u0131 University, Istanbul, Turkey"],"raw_orcid":"https://orcid.org/0000-0002-8501-6209","affiliations":[{"raw_affiliation_string":"Faculty of Engineering and Natural Sciences, Sabanc\u0131 University, Istanbul, Turkey","institution_ids":["https://openalex.org/I134235054"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5051657734","display_name":"\u00d6znur Ta\u015ftan","orcid":"https://orcid.org/0000-0001-7058-5372"},"institutions":[{"id":"https://openalex.org/I134235054","display_name":"Sabanc\u0131 \u00dcniversitesi","ror":"https://ror.org/049asqa32","country_code":"TR","type":"education","lineage":["https://openalex.org/I134235054"]}],"countries":["TR"],"is_corresponding":true,"raw_author_name":"Oznur Tastan","raw_affiliation_strings":["Faculty of Engineering and Natural Sciences, Sabanc\u0131 University, Istanbul, Turkey"],"raw_orcid":"https://orcid.org/0000-0001-7058-5372","affiliations":[{"raw_affiliation_string":"Faculty of Engineering and Natural Sciences, Sabanc\u0131 University, Istanbul, Turkey","institution_ids":["https://openalex.org/I134235054"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5035084467","https://openalex.org/A5051657734"],"corresponding_institution_ids":["https://openalex.org/I134235054"],"apc_list":null,"apc_paid":null,"fwci":0.852,"has_fulltext":true,"cited_by_count":5,"citation_normalized_percentile":{"value":0.78105123,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"30","issue":"3","first_page":"602","last_page":"624"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.9939000010490417,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.9296239018440247},{"id":"https://openalex.org/keywords/named-entity-recognition","display_name":"Named-entity recognition","score":0.8318626880645752},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6279723644256592},{"id":"https://openalex.org/keywords/normalization","display_name":"Normalization (sociology)","score":0.5915743708610535},{"id":"https://openalex.org/keywords/security-token","display_name":"Security token","score":0.5867809057235718},{"id":"https://openalex.org/keywords/sentence","display_name":"Sentence","score":0.5643141865730286},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.5532485842704773},{"id":"https://openalex.org/keywords/labeled-data","display_name":"Labeled data","score":0.5373960733413696},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5061144232749939},{"id":"https://openalex.org/keywords/named-entity","display_name":"Named entity","score":0.4162186086177826},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3950806260108948},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.17619794607162476}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.9296239018440247},{"id":"https://openalex.org/C2779135771","wikidata":"https://www.wikidata.org/wiki/Q403574","display_name":"Named-entity recognition","level":3,"score":0.8318626880645752},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6279723644256592},{"id":"https://openalex.org/C136886441","wikidata":"https://www.wikidata.org/wiki/Q926129","display_name":"Normalization (sociology)","level":2,"score":0.5915743708610535},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.5867809057235718},{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.5643141865730286},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.5532485842704773},{"id":"https://openalex.org/C2776145971","wikidata":"https://www.wikidata.org/wiki/Q30673951","display_name":"Labeled data","level":2,"score":0.5373960733413696},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5061144232749939},{"id":"https://openalex.org/C2777889803","wikidata":"https://www.wikidata.org/wiki/Q25047676","display_name":"Named entity","level":2,"score":0.4162186086177826},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3950806260108948},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.17619794607162476},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C19165224","wikidata":"https://www.wikidata.org/wiki/Q23404","display_name":"Anthropology","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1017/s1351324923000165","is_oa":true,"landing_page_url":"https://doi.org/10.1017/s1351324923000165","pdf_url":"https://www.cambridge.org/core/services/aop-cambridge-core/content/view/087DF41DC645A49AA712D55D486405DD/S1351324923000165a.pdf/div-class-title-focusing-on-potential-named-entities-during-active-label-acquisition-div.pdf","source":{"id":"https://openalex.org/S18088403","display_name":"Natural Language Engineering","issn_l":"1351-3249","issn":["1351-3249","1469-8110"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311721","host_organization_name":"Cambridge University Press","host_organization_lineage":["https://openalex.org/P4310311721","https://openalex.org/P4310311702"],"host_organization_lineage_names":["Cambridge University Press","University of Cambridge"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Natural Language Engineering","raw_type":"journal-article"},{"id":"pmh:oai:research.sabanciuniv.edu:47404","is_oa":false,"landing_page_url":"https://research.sabanciuniv.edu/id/eprint/47404/","pdf_url":null,"source":{"id":"https://openalex.org/S4306402254","display_name":"Sabanci University","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I134235054","host_organization_name":"Sabanc\u0131 \u00dcniversitesi","host_organization_lineage":["https://openalex.org/I134235054"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Article"}],"best_oa_location":{"id":"doi:10.1017/s1351324923000165","is_oa":true,"landing_page_url":"https://doi.org/10.1017/s1351324923000165","pdf_url":"https://www.cambridge.org/core/services/aop-cambridge-core/content/view/087DF41DC645A49AA712D55D486405DD/S1351324923000165a.pdf/div-class-title-focusing-on-potential-named-entities-during-active-label-acquisition-div.pdf","source":{"id":"https://openalex.org/S18088403","display_name":"Natural Language Engineering","issn_l":"1351-3249","issn":["1351-3249","1469-8110"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311721","host_organization_name":"Cambridge University Press","host_organization_lineage":["https://openalex.org/P4310311721","https://openalex.org/P4310311702"],"host_organization_lineage_names":["Cambridge University Press","University of Cambridge"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Natural Language Engineering","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.6600000262260437,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4379519265.pdf"},"referenced_works_count":52,"referenced_works":["https://openalex.org/W52840134","https://openalex.org/W151377110","https://openalex.org/W1513874326","https://openalex.org/W1580375566","https://openalex.org/W1956471287","https://openalex.org/W1995875735","https://openalex.org/W2010588484","https://openalex.org/W2051434435","https://openalex.org/W2055617685","https://openalex.org/W2074064986","https://openalex.org/W2095729244","https://openalex.org/W2113152670","https://openalex.org/W2114663556","https://openalex.org/W2117763124","https://openalex.org/W2126716476","https://openalex.org/W2132038179","https://openalex.org/W2135459176","https://openalex.org/W2144182447","https://openalex.org/W2144452292","https://openalex.org/W2144578941","https://openalex.org/W2147880316","https://openalex.org/W2154250549","https://openalex.org/W2169099542","https://openalex.org/W2171671120","https://openalex.org/W2180566385","https://openalex.org/W2252069213","https://openalex.org/W2294798173","https://openalex.org/W2346452181","https://openalex.org/W2509700522","https://openalex.org/W2785787385","https://openalex.org/W2786672974","https://openalex.org/W2896457183","https://openalex.org/W2911489562","https://openalex.org/W2963716420","https://openalex.org/W2965373594","https://openalex.org/W2970352191","https://openalex.org/W2976444281","https://openalex.org/W2999905431","https://openalex.org/W3009431628","https://openalex.org/W3035858791","https://openalex.org/W3098466758","https://openalex.org/W3197209004","https://openalex.org/W4206797693","https://openalex.org/W4288089799","https://openalex.org/W6606205340","https://openalex.org/W6675206559","https://openalex.org/W6682578415","https://openalex.org/W6686604339","https://openalex.org/W6756615331","https://openalex.org/W6769627184","https://openalex.org/W6774952039","https://openalex.org/W6793751678"],"related_works":["https://openalex.org/W2032007337","https://openalex.org/W2793132289","https://openalex.org/W2186562580","https://openalex.org/W2155874911","https://openalex.org/W1884363728","https://openalex.org/W2916255597","https://openalex.org/W4386977977","https://openalex.org/W4253099099","https://openalex.org/W3035097673","https://openalex.org/W3022333975"],"abstract_inverted_index":{"Abstract":[0],"Named":[1],"entity":[2,22],"recognition":[3],"(NER)":[4],"aims":[5],"to":[6,31,68,107,132],"identify":[7],"mentions":[8],"of":[9,48,83,158],"named":[10,21],"entities":[11],"in":[12,36,87],"an":[13],"unstructured":[14],"text":[15],"and":[16,111,119],"classify":[17],"them":[18],"into":[19],"predefined":[20],"classes.":[23],"While":[24],"deep":[25],"learning-based":[26],"pre-trained":[27],"language":[28],"models":[29],"help":[30],"achieve":[32],"good":[33],"predictive":[34],"performances":[35],"NER,":[37],"many":[38],"domain-specific":[39],"NER":[40,66],"applications":[41],"still":[42],"call":[43],"for":[44,57,65,93],"a":[45,54,127],"substantial":[46],"amount":[47],"labeled":[49],"data.":[50],"Active":[51],"learning":[52],"(AL),":[53],"general":[55],"framework":[56],"the":[58,70,78,152,156],"label":[59],"acquisition":[60],"problem,":[61],"has":[62],"been":[63],"used":[64],"tasks":[67],"minimize":[69],"annotation":[71],"cost":[72,121],"without":[73],"sacrificing":[74],"model":[75],"performance.":[76],"However,":[77],"heavily":[79],"imbalanced":[80],"class":[81],"distribution":[82],"tokens":[84,110,160],"introduces":[85],"challenges":[86],"designing":[88],"effective":[89],"AL":[90,98],"querying":[91],"methods":[92],"NER.":[94],"We":[95,124],"propose":[96,126],"several":[97],"sentence":[99],"query":[100],"evaluation":[101,122],"functions":[102,115],"that":[103,135,151],"pay":[104],"more":[105],"attention":[106],"potential":[108],"positive":[109],"evaluate":[112],"these":[113],"proposed":[114,153],"with":[116,168],"both":[117],"sentence-based":[118],"token-based":[120],"strategies.":[123],"also":[125],"better":[128,163],"data-driven":[129],"normalization":[130],"approach":[131,154],"penalize":[133],"sentences":[134],"are":[136],"too":[137,140],"long":[138],"or":[139,164],"short.":[141],"Our":[142],"experiments":[143],"on":[144],"three":[145],"datasets":[146],"from":[147],"different":[148],"domains":[149],"reveal":[150],"reduces":[155],"number":[157],"annotated":[159],"while":[161],"achieving":[162],"comparable":[165],"prediction":[166],"performance":[167],"conventional":[169],"methods.":[170]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":1}],"updated_date":"2026-01-25T23:04:38.658462","created_date":"2023-06-07T00:00:00"}
