{"id":"https://openalex.org/W4221099399","doi":"https://doi.org/10.1109/tr.2022.3156126","title":"Construction and Evaluation of a High-Quality Corpus for Legal Intelligence Using Semiautomated Approaches","display_name":"Construction and Evaluation of a High-Quality Corpus for Legal Intelligence Using Semiautomated Approaches","publication_year":2022,"publication_date":"2022-03-25","ids":{"openalex":"https://openalex.org/W4221099399","doi":"https://doi.org/10.1109/tr.2022.3156126"},"language":"en","primary_location":{"id":"doi:10.1109/tr.2022.3156126","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tr.2022.3156126","pdf_url":null,"source":{"id":"https://openalex.org/S87725633","display_name":"IEEE Transactions on Reliability","issn_l":"0018-9529","issn":["0018-9529","1558-1721"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Reliability","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://zenodo.org/record/6862510","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100670005","display_name":"Haihua Chen","orcid":"https://orcid.org/0000-0002-7088-9752"},"institutions":[{"id":"https://openalex.org/I123534392","display_name":"University of North Texas","ror":"https://ror.org/00v97ad02","country_code":"US","type":"education","lineage":["https://openalex.org/I123534392"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Haihua Chen","raw_affiliation_strings":["Department of Information Science, University of North Texas, Denton, TX, USA"],"raw_orcid":"https://orcid.org/0000-0002-7088-9752","affiliations":[{"raw_affiliation_string":"Department of Information Science, University of North Texas, Denton, TX, USA","institution_ids":["https://openalex.org/I123534392"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080569966","display_name":"Lavinia F. Pieptea","orcid":null},"institutions":[{"id":"https://openalex.org/I123534392","display_name":"University of North Texas","ror":"https://ror.org/00v97ad02","country_code":"US","type":"education","lineage":["https://openalex.org/I123534392"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Lavinia F. Pieptea","raw_affiliation_strings":["Department of Mathematics, University of North Texas, Denton, TX, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Mathematics, University of North Texas, Denton, TX, USA","institution_ids":["https://openalex.org/I123534392"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5049161723","display_name":"Junhua Ding","orcid":"https://orcid.org/0000-0002-9394-6748"},"institutions":[{"id":"https://openalex.org/I123534392","display_name":"University of North Texas","ror":"https://ror.org/00v97ad02","country_code":"US","type":"education","lineage":["https://openalex.org/I123534392"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Junhua Ding","raw_affiliation_strings":["Department of Information Science, University of North Texas, Denton, TX, USA"],"raw_orcid":"https://orcid.org/0000-0002-9394-6748","affiliations":[{"raw_affiliation_string":"Department of Information Science, University of North Texas, Denton, TX, USA","institution_ids":["https://openalex.org/I123534392"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5100670005"],"corresponding_institution_ids":["https://openalex.org/I123534392"],"apc_list":null,"apc_paid":null,"fwci":4.0232,"has_fulltext":false,"cited_by_count":29,"citation_normalized_percentile":{"value":0.94379888,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":"71","issue":"2","first_page":"657","last_page":"673"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13643","display_name":"Artificial Intelligence in Law","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/3320","display_name":"Political Science and International Relations"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12034","display_name":"Digital and Cyber Forensics","score":0.9617999792098999,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7961092591285706},{"id":"https://openalex.org/keywords/correctness","display_name":"Correctness","score":0.7399560213088989},{"id":"https://openalex.org/keywords/upsampling","display_name":"Upsampling","score":0.7036629915237427},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6864355206489563},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.6717982292175293},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.6113262176513672},{"id":"https://openalex.org/keywords/generative-adversarial-network","display_name":"Generative adversarial network","score":0.4426153302192688},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.4418877363204956},{"id":"https://openalex.org/keywords/semi-supervised-learning","display_name":"Semi-supervised learning","score":0.4233127534389496},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3696136772632599},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3581136465072632},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.09084618091583252}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7961092591285706},{"id":"https://openalex.org/C55439883","wikidata":"https://www.wikidata.org/wiki/Q360812","display_name":"Correctness","level":2,"score":0.7399560213088989},{"id":"https://openalex.org/C110384440","wikidata":"https://www.wikidata.org/wiki/Q1143270","display_name":"Upsampling","level":3,"score":0.7036629915237427},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6864355206489563},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.6717982292175293},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.6113262176513672},{"id":"https://openalex.org/C2988773926","wikidata":"https://www.wikidata.org/wiki/Q25104379","display_name":"Generative adversarial network","level":3,"score":0.4426153302192688},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.4418877363204956},{"id":"https://openalex.org/C58973888","wikidata":"https://www.wikidata.org/wiki/Q1041418","display_name":"Semi-supervised learning","level":2,"score":0.4233127534389496},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3696136772632599},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3581136465072632},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.09084618091583252},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tr.2022.3156126","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tr.2022.3156126","pdf_url":null,"source":{"id":"https://openalex.org/S87725633","display_name":"IEEE Transactions on Reliability","issn_l":"0018-9529","issn":["0018-9529","1558-1721"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Reliability","raw_type":"journal-article"},{"id":"pmh:oai:zenodo.org:6862510","is_oa":true,"landing_page_url":"https://zenodo.org/record/6862510","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/article"}],"best_oa_location":{"id":"pmh:oai:zenodo.org:6862510","is_oa":true,"landing_page_url":"https://zenodo.org/record/6862510","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/article"},"sustainable_development_goals":[{"score":0.4099999964237213,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":111,"referenced_works":["https://openalex.org/W1501234159","https://openalex.org/W1977155386","https://openalex.org/W2001800999","https://openalex.org/W2026568525","https://openalex.org/W2029851691","https://openalex.org/W2031921586","https://openalex.org/W2044405664","https://openalex.org/W2061702164","https://openalex.org/W2078268845","https://openalex.org/W2097089247","https://openalex.org/W2104540263","https://openalex.org/W2111700528","https://openalex.org/W2119707623","https://openalex.org/W2134510195","https://openalex.org/W2144232471","https://openalex.org/W2153804780","https://openalex.org/W2158880898","https://openalex.org/W2346248621","https://openalex.org/W2401483332","https://openalex.org/W2593597018","https://openalex.org/W2594110573","https://openalex.org/W2747264013","https://openalex.org/W2768348081","https://openalex.org/W2805389643","https://openalex.org/W2807243245","https://openalex.org/W2842153692","https://openalex.org/W2854210280","https://openalex.org/W2893709526","https://openalex.org/W2896457183","https://openalex.org/W2900611605","https://openalex.org/W2911329389","https://openalex.org/W2912804155","https://openalex.org/W2920714840","https://openalex.org/W2946595616","https://openalex.org/W2962854673","https://openalex.org/W2963373786","https://openalex.org/W2963594477","https://openalex.org/W2964745622","https://openalex.org/W2965006690","https://openalex.org/W2966518071","https://openalex.org/W2966808454","https://openalex.org/W2970923431","https://openalex.org/W2971296908","https://openalex.org/W2971644666","https://openalex.org/W2972905031","https://openalex.org/W2975583675","https://openalex.org/W2976295868","https://openalex.org/W2979666134","https://openalex.org/W2984353870","https://openalex.org/W2985169259","https://openalex.org/W2987088247","https://openalex.org/W2998768810","https://openalex.org/W3006296400","https://openalex.org/W3006787827","https://openalex.org/W3022807652","https://openalex.org/W3034942609","https://openalex.org/W3035308065","https://openalex.org/W3035454789","https://openalex.org/W3035668167","https://openalex.org/W3037647403","https://openalex.org/W3041123495","https://openalex.org/W3041133507","https://openalex.org/W3046441874","https://openalex.org/W3076947077","https://openalex.org/W3091431885","https://openalex.org/W3096580779","https://openalex.org/W3100124407","https://openalex.org/W3101273072","https://openalex.org/W3104548400","https://openalex.org/W3118813946","https://openalex.org/W3130113475","https://openalex.org/W3130347092","https://openalex.org/W3135190223","https://openalex.org/W3155088253","https://openalex.org/W3156333129","https://openalex.org/W3157799840","https://openalex.org/W3159579291","https://openalex.org/W3160574899","https://openalex.org/W3174828871","https://openalex.org/W3186492090","https://openalex.org/W3199064974","https://openalex.org/W4287633338","https://openalex.org/W4287796293","https://openalex.org/W4292779060","https://openalex.org/W4294214983","https://openalex.org/W4320013936","https://openalex.org/W6677773858","https://openalex.org/W6682780409","https://openalex.org/W6712805847","https://openalex.org/W6718379498","https://openalex.org/W6742720488","https://openalex.org/W6745609711","https://openalex.org/W6752735244","https://openalex.org/W6752763621","https://openalex.org/W6754920418","https://openalex.org/W6755207826","https://openalex.org/W6763088532","https://openalex.org/W6766137252","https://openalex.org/W6766602542","https://openalex.org/W6767887823","https://openalex.org/W6777141889","https://openalex.org/W6778883912","https://openalex.org/W6780448636","https://openalex.org/W6781051561","https://openalex.org/W6783507087","https://openalex.org/W6783904218","https://openalex.org/W6784337422","https://openalex.org/W6784572768","https://openalex.org/W6784628404","https://openalex.org/W6786517142","https://openalex.org/W6791145691"],"related_works":["https://openalex.org/W2062399876","https://openalex.org/W3008339103","https://openalex.org/W2404647514","https://openalex.org/W1667647204","https://openalex.org/W2607795551","https://openalex.org/W4247536566","https://openalex.org/W3119814709","https://openalex.org/W3155117723","https://openalex.org/W4300743398","https://openalex.org/W4312121420"],"abstract_inverted_index":{"A":[0],"high-quality":[1],"corpus":[2,16,38,52,76,278],"is":[3,53],"essential":[4],"for":[5,166,203,241,256,263],"building":[6,45],"an":[7,74],"effective":[8,145],"legal":[9,37,51,208,277],"intelligence":[10],"system.":[11],"The":[12,31,92,179,223,268],"quality":[13,20,26,33,108,114,213,231,245],"of":[14,21,27,35,101,115,157,195,206,247,259],"a":[15,36,46,54,62,207,248,254],"includes":[17],"both":[18],"the":[19,25,69,105,113,116,122,134,143,149,155,189,204,229,257,272,276],"original":[22],"data":[23,103,168,230,242,264],"and":[24,42,49,99,126,131,140,174,200,217,228,244,266,275,281],"its":[28,90],"corresponding":[29],"labeling.":[30],"major":[32,107],"dimensions":[34],"include":[39],"comprehensiveness,":[40,215],"freshness,":[41,216],"correctness.":[43],"However,":[44],"comprehensive,":[47],"correct,":[48],"fresh":[50],"grand":[55],"challenge.":[56,70],"In":[57,151],"this":[58,236],"article,":[59],"we":[60,160],"propose":[61],"semiautomated":[63,224],"machine":[64,163,225,260,269],"learning":[65,164,186,194,226,261,270],"framework":[66,227],"to":[67,88,147,153,220],"address":[68,148,154],"We":[71,124],"first":[72],"created":[73],"initial":[75,93],"with":[77,184,202],"4937":[78],"instances":[79],"that":[80,96,110,118,133,182],"were":[81,86],"manually":[82],"labeled.":[83],"Several":[84],"strategies":[85],"implemented":[87],"assure":[89],"quality.":[91],"results":[94,180],"showed":[95,181],"class":[97],"imbalance":[98],"insufficiency":[100,156],"training":[102,158,273],"are":[104,279],"two":[106],"issues":[109],"negatively":[111],"impacted":[112],"system":[117],"was":[119,142,198],"built":[120],"on":[121],"data.":[123],"experimented":[125,161,201],"compared":[127,219],"three":[128],"class-imbalance-handling":[129],"techniques":[130],"found":[132],"mixed-sampling":[135],"method,":[136],"which":[137,210],"combines":[138],"upsampling":[139],"downsampling,":[141],"most":[144],"way":[146],"issue.":[150],"order":[152],"data,":[159,274],"several":[162],"methods":[165,262],"automated":[167],"augmentation":[169,243,265],"including":[170],"pseudolabeling,":[171],"co-training,":[172],"expectation-maximization,":[173],"generative":[175],"adversarial":[176],"network":[177],"(GAN).":[178],"GAN":[183],"deep":[185],"models":[187],"achieved":[188],"best":[190],"performance.":[191],"Finally,":[192],"ensemble":[193],"different":[196],"classifiers":[197],"proposed":[199],"construction":[205],"corpus,":[209],"achieves":[211],"higher":[212],"in":[214,235],"correctness":[218],"existing":[221],"work.":[222],"evaluation":[232,246],"method":[233],"developed":[234],"research":[237],"can":[238],"be":[239],"used":[240],"large":[249],"dataset":[250],"as":[251,253],"well":[252],"reference":[255],"selection":[258],"generation.":[267],"models,":[271],"published":[280],"publicly":[282],"accessible":[283],"at":[284],"[Online].":[285],"Available:":[286],"<uri":[287],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[288],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">https://github.com/haihua0913/legalArgumentmining</uri>":[289],".":[290]},"counts_by_year":[{"year":2025,"cited_by_count":11},{"year":2024,"cited_by_count":6},{"year":2023,"cited_by_count":12}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
