{"id":"https://openalex.org/W2148282103","doi":"https://doi.org/10.3115/v1/p14-1104","title":"Active Learning with Efficient Feature Weighting Methods for Improving Data Quality and Classification Accuracy","display_name":"Active Learning with Efficient Feature Weighting Methods for Improving Data Quality and Classification Accuracy","publication_year":2014,"publication_date":"2014-01-01","ids":{"openalex":"https://openalex.org/W2148282103","doi":"https://doi.org/10.3115/v1/p14-1104","mag":"2148282103"},"language":"en","primary_location":{"id":"doi:10.3115/v1/p14-1104","is_oa":true,"landing_page_url":"https://doi.org/10.3115/v1/p14-1104","pdf_url":"https://aclanthology.org/P14-1104.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 52nd Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://aclanthology.org/P14-1104.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5050280503","display_name":"Justin Martineau","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Justin Martineau","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100605099","display_name":"Chen L\u00fc","orcid":"https://orcid.org/0000-0003-1927-2391"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lu Chen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109850197","display_name":"Doreen Cheng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Doreen Cheng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5028772801","display_name":"Amit Sheth","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Amit Sheth","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5050280503"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.8456,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.82306961,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"1104","last_page":"1112"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11704","display_name":"Mobile Crowdsensing and Crowdsourcing","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8169180154800415},{"id":"https://openalex.org/keywords/weighting","display_name":"Weighting","score":0.773298978805542},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6005423069000244},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.5842440724372864},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5778390169143677},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5688083171844482},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.518599271774292},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.4902408719062805},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.49014124274253845},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.4829823076725006},{"id":"https://openalex.org/keywords/learning-to-rank","display_name":"Learning to rank","score":0.4381108283996582},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4230392277240753},{"id":"https://openalex.org/keywords/ranking","display_name":"Ranking (information retrieval)","score":0.17372065782546997}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8169180154800415},{"id":"https://openalex.org/C183115368","wikidata":"https://www.wikidata.org/wiki/Q856577","display_name":"Weighting","level":2,"score":0.773298978805542},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6005423069000244},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.5842440724372864},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5778390169143677},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5688083171844482},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.518599271774292},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.4902408719062805},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.49014124274253845},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.4829823076725006},{"id":"https://openalex.org/C86037889","wikidata":"https://www.wikidata.org/wiki/Q4330127","display_name":"Learning to rank","level":3,"score":0.4381108283996582},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4230392277240753},{"id":"https://openalex.org/C189430467","wikidata":"https://www.wikidata.org/wiki/Q7293293","display_name":"Ranking (information retrieval)","level":2,"score":0.17372065782546997},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C126838900","wikidata":"https://www.wikidata.org/wiki/Q77604","display_name":"Radiology","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":5,"locations":[{"id":"doi:10.3115/v1/p14-1104","is_oa":true,"landing_page_url":"https://doi.org/10.3115/v1/p14-1104","pdf_url":"https://aclanthology.org/P14-1104.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 52nd Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)","raw_type":"proceedings-article"},{"id":"pmh:oai:corescholar.libraries.wright.edu:knoesis-1951","is_oa":true,"landing_page_url":"https://corescholar.libraries.wright.edu/knoesis/575","pdf_url":null,"source":{"id":"https://openalex.org/S2737205702","display_name":"Journal of Bioresource Management","issn_l":"2309-3854","issn":["2309-3854"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":"https://openalex.org/P4310316536","host_organization_name":"Bioresource Research Center (BRC), Islamabad","host_organization_lineage":["https://openalex.org/P4310316536"],"host_organization_lineage_names":["Bioresource Research Center (BRC), Islamabad"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Kno.e.sis Publications","raw_type":"text"},{"id":"pmh:oai:scholarcommons.sc.edu:aii_fac_pub-1105","is_oa":false,"landing_page_url":"https://scholarcommons.sc.edu/aii_fac_pub/105","pdf_url":null,"source":{"id":"https://openalex.org/S4306401386","display_name":"Scholar Commons (University of South Carolina)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I155781252","host_organization_name":"University of South Carolina","host_organization_lineage":["https://openalex.org/I155781252"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Publications","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.669.8525","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.669.8525","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://aclweb.org/anthology/P/P14/P14-1104.pdf","raw_type":"text"},{"id":"pmh:oai:works.bepress.com:amit_sheth-1204","is_oa":true,"landing_page_url":"https://works.bepress.com/amit_sheth/205","pdf_url":null,"source":{"id":"https://openalex.org/S2737205702","display_name":"Journal of Bioresource Management","issn_l":"2309-3854","issn":["2309-3854"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":"https://openalex.org/P4310316536","host_organization_name":"Bioresource Research Center (BRC), Islamabad","host_organization_lineage":["https://openalex.org/P4310316536"],"host_organization_lineage_names":["Bioresource Research Center (BRC), Islamabad"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Amit P. Sheth","raw_type":"text"}],"best_oa_location":{"id":"doi:10.3115/v1/p14-1104","is_oa":true,"landing_page_url":"https://doi.org/10.3115/v1/p14-1104","pdf_url":"https://aclanthology.org/P14-1104.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 52nd Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W2148282103.pdf"},"referenced_works_count":23,"referenced_works":["https://openalex.org/W1522454948","https://openalex.org/W1537489869","https://openalex.org/W1595276678","https://openalex.org/W1604329830","https://openalex.org/W1744114474","https://openalex.org/W1898031563","https://openalex.org/W1970381522","https://openalex.org/W1971222444","https://openalex.org/W2007417114","https://openalex.org/W2079899298","https://openalex.org/W2088517004","https://openalex.org/W2091084672","https://openalex.org/W2092804630","https://openalex.org/W2098933520","https://openalex.org/W2118585731","https://openalex.org/W2120196261","https://openalex.org/W2125943921","https://openalex.org/W2135731857","https://openalex.org/W2143539737","https://openalex.org/W2151401338","https://openalex.org/W2172059508","https://openalex.org/W2903158431","https://openalex.org/W3100570787"],"related_works":["https://openalex.org/W2180954594","https://openalex.org/W2361861616","https://openalex.org/W2052835778","https://openalex.org/W2263699433","https://openalex.org/W2377979023","https://openalex.org/W2049003611","https://openalex.org/W2127804977","https://openalex.org/W2108418243","https://openalex.org/W2218034408","https://openalex.org/W2392921965"],"abstract_inverted_index":{"Many":[0],"machine":[1],"learning":[2],"datasets":[3],"are":[4],"noisy":[5],"with":[6],"a":[7,24,49,98],"substantial":[8],"number":[9],"of":[10,101],"mislabeled":[11,64],"instances.":[12],"This":[13],"noise":[14],"yields":[15],"sub-optimal":[16],"classification":[17],"performance.":[18],"In":[19],"this":[20],"paper":[21],"we":[22],"study":[23],"large,":[25],"low":[26,72],"quality":[27,70],"annotated":[28],"dataset,":[29],"created":[30],"quickly":[31],"and":[32,48,61],"cheaply":[33],"using":[34],"Amazon":[35],"Mechanical":[36],"Turk":[37],"to":[38,59,66],"crowdsource":[39],"annotations.":[40],"We":[41],"describe":[42],"computationally":[43,92],"cheap":[44],"feature":[45],"weighting":[46],"techniques":[47,96],"novel":[50],"non-linear":[51],"distribution":[52],"spreading":[53],"algorithm":[54],"that":[55,83],"can":[56],"be":[57],"used":[58],"iteratively":[60],"interactively":[62],"correcting":[63],"instances":[65],"significantly":[67],"improve":[68],"annotation":[69],"at":[71],"cost.":[73],"Eight":[74],"different":[75],"emotion":[76],"extraction":[77],"experiments":[78],"on":[79],"Twitter":[80],"data":[81],"demonstrate":[82],"our":[84],"approach":[85],"is":[86],"just":[87],"as":[88,90],"effective":[89],"more":[91],"expensive":[93],"techniques.":[94],"Our":[95],"save":[97],"considerable":[99],"amount":[100],"time.":[102]},"counts_by_year":[{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":1}],"updated_date":"2026-05-22T09:01:20.584952","created_date":"2025-10-10T00:00:00"}
