{"id":"https://openalex.org/W3163699936","doi":"https://doi.org/10.1145/3462757.3466085","title":"Structural text segmentation of legal documents","display_name":"Structural text segmentation of legal documents","publication_year":2021,"publication_date":"2021-06-21","ids":{"openalex":"https://openalex.org/W3163699936","doi":"https://doi.org/10.1145/3462757.3466085","mag":"3163699936"},"language":"en","primary_location":{"id":"doi:10.1145/3462757.3466085","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3462757.3466085","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Eighteenth International Conference on Artificial Intelligence and Law","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2012.03619","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5039484875","display_name":"Dennis Aumiller","orcid":"https://orcid.org/0000-0001-8296-6797"},"institutions":[{"id":"https://openalex.org/I223822909","display_name":"Heidelberg University","ror":"https://ror.org/038t36y30","country_code":"DE","type":"education","lineage":["https://openalex.org/I223822909"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Dennis Aumiller","raw_affiliation_strings":["Heidelberg University, Heidelberg, Germany"],"affiliations":[{"raw_affiliation_string":"Heidelberg University, Heidelberg, Germany","institution_ids":["https://openalex.org/I223822909"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081759761","display_name":"Satya Almasian","orcid":"https://orcid.org/0000-0002-1884-0484"},"institutions":[{"id":"https://openalex.org/I223822909","display_name":"Heidelberg University","ror":"https://ror.org/038t36y30","country_code":"DE","type":"education","lineage":["https://openalex.org/I223822909"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Satya Almasian","raw_affiliation_strings":["Heidelberg University, Heidelberg, Germany"],"affiliations":[{"raw_affiliation_string":"Heidelberg University, Heidelberg, Germany","institution_ids":["https://openalex.org/I223822909"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076226398","display_name":"Sebastian Lackner","orcid":null},"institutions":[{"id":"https://openalex.org/I223822909","display_name":"Heidelberg University","ror":"https://ror.org/038t36y30","country_code":"DE","type":"education","lineage":["https://openalex.org/I223822909"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Sebastian Lackner","raw_affiliation_strings":["Heidelberg University, Heidelberg, Germany"],"affiliations":[{"raw_affiliation_string":"Heidelberg University, Heidelberg, Germany","institution_ids":["https://openalex.org/I223822909"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5061021795","display_name":"Michael Gertz","orcid":"https://orcid.org/0000-0003-4530-6110"},"institutions":[{"id":"https://openalex.org/I223822909","display_name":"Heidelberg University","ror":"https://ror.org/038t36y30","country_code":"DE","type":"education","lineage":["https://openalex.org/I223822909"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Michael Gertz","raw_affiliation_strings":["Heidelberg University, Heidelberg, Germany"],"affiliations":[{"raw_affiliation_string":"Heidelberg University, Heidelberg, Germany","institution_ids":["https://openalex.org/I223822909"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5039484875"],"corresponding_institution_ids":["https://openalex.org/I223822909"],"apc_list":null,"apc_paid":null,"fwci":20.935,"has_fulltext":false,"cited_by_count":35,"citation_normalized_percentile":{"value":0.99202003,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"2","last_page":"11"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13643","display_name":"Artificial Intelligence in Law","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/3320","display_name":"Political Science and International Relations"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T13643","display_name":"Artificial Intelligence in Law","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/3320","display_name":"Political Science and International Relations"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9901000261306763,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.980400025844574,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8620448112487793},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.6882914900779724},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5714789032936096},{"id":"https://openalex.org/keywords/coherence","display_name":"Coherence (philosophical gambling strategy)","score":0.5117313861846924},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4864075183868408},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.48499032855033875},{"id":"https://openalex.org/keywords/downstream","display_name":"Downstream (manufacturing)","score":0.48066627979278564},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.466489315032959},{"id":"https://openalex.org/keywords/market-segmentation","display_name":"Market segmentation","score":0.45955124497413635},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.45034122467041016},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4368165135383606},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.32730725407600403}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8620448112487793},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.6882914900779724},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5714789032936096},{"id":"https://openalex.org/C2781181686","wikidata":"https://www.wikidata.org/wiki/Q4226068","display_name":"Coherence (philosophical gambling strategy)","level":2,"score":0.5117313861846924},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4864075183868408},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.48499032855033875},{"id":"https://openalex.org/C2776207758","wikidata":"https://www.wikidata.org/wiki/Q5303302","display_name":"Downstream (manufacturing)","level":2,"score":0.48066627979278564},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.466489315032959},{"id":"https://openalex.org/C125308379","wikidata":"https://www.wikidata.org/wiki/Q363057","display_name":"Market segmentation","level":2,"score":0.45955124497413635},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.45034122467041016},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4368165135383606},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.32730725407600403},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C162853370","wikidata":"https://www.wikidata.org/wiki/Q39809","display_name":"Marketing","level":1,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3462757.3466085","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3462757.3466085","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Eighteenth International Conference on Artificial Intelligence and Law","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2012.03619","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2012.03619","pdf_url":"https://arxiv.org/pdf/2012.03619","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2012.03619","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2012.03619","pdf_url":"https://arxiv.org/pdf/2012.03619","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions","score":0.7200000286102295}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":53,"referenced_works":["https://openalex.org/W1514981065","https://openalex.org/W1557074680","https://openalex.org/W1590118338","https://openalex.org/W1626945812","https://openalex.org/W1781198478","https://openalex.org/W1828401780","https://openalex.org/W1862888253","https://openalex.org/W1880262756","https://openalex.org/W1969351518","https://openalex.org/W1979469248","https://openalex.org/W1989896487","https://openalex.org/W2017776283","https://openalex.org/W2065840553","https://openalex.org/W2070811760","https://openalex.org/W2080179128","https://openalex.org/W2100626830","https://openalex.org/W2100873065","https://openalex.org/W2104210067","https://openalex.org/W2107743791","https://openalex.org/W2112971401","https://openalex.org/W2118612506","https://openalex.org/W2120101509","https://openalex.org/W2148818577","https://openalex.org/W2149041454","https://openalex.org/W2250539671","https://openalex.org/W2346917897","https://openalex.org/W2406834049","https://openalex.org/W2512217112","https://openalex.org/W2596512067","https://openalex.org/W2799051010","https://openalex.org/W2882319491","https://openalex.org/W2888922453","https://openalex.org/W2896457183","https://openalex.org/W2918995630","https://openalex.org/W2946065814","https://openalex.org/W2953979308","https://openalex.org/W2955290639","https://openalex.org/W2955781381","https://openalex.org/W2962716111","https://openalex.org/W2963341956","https://openalex.org/W2963403868","https://openalex.org/W2965373594","https://openalex.org/W2970641574","https://openalex.org/W2980282514","https://openalex.org/W2997244287","https://openalex.org/W2998609982","https://openalex.org/W3045464143","https://openalex.org/W3108142956","https://openalex.org/W4231510805","https://openalex.org/W4233135949","https://openalex.org/W4233620316","https://openalex.org/W4238205294","https://openalex.org/W4385245566"],"related_works":["https://openalex.org/W2592395359","https://openalex.org/W2535231171","https://openalex.org/W2045342254","https://openalex.org/W1501331687","https://openalex.org/W2326647871","https://openalex.org/W4205247302","https://openalex.org/W2468652214","https://openalex.org/W2501551404","https://openalex.org/W1504527458","https://openalex.org/W2130144716"],"abstract_inverted_index":{"The":[0],"growing":[1],"complexity":[2],"of":[3,49,56,91,117,134,151,181],"legal":[4,13,182],"cases":[5],"has":[6],"lead":[7],"to":[8,31,178,191],"an":[9],"increasing":[10],"interest":[11],"in":[12],"information":[14,22],"retrieval":[15],"systems":[16,27],"that":[17,86,137,168],"can":[18,87],"effectively":[19,98],"satisfy":[20],"user-specific":[21],"needs.":[23],"However,":[24],"such":[25],"downstream":[26,109],"typically":[28],"require":[29],"documents":[30],"be":[32],"properly":[33],"formatted":[34],"and":[35,102,121,175,188],"segmented,":[36],"which":[37,61,69,161],"is":[38],"often":[39],"done":[40],"with":[41],"relatively":[42],"simple":[43],"pre-processing":[44],"steps,":[45],"disregarding":[46],"topical":[47,89,127],"coherence":[48,90],"segments.":[50],"Systems":[51],"generally":[52],"rely":[53],"on":[54,115,142],"representations":[55],"individual":[57],"sentences":[58],"or":[59,66],"paragraphs,":[60,97],"may":[62],"lack":[63],"crucial":[64],"context,":[65],"document-level":[67],"representations,":[68],"are":[70],"too":[71],"long":[72],"for":[73,108,139,164,195],"meaningful":[74],"search":[75],"results.":[76],"To":[77],"address":[78],"this":[79],"issue,":[80],"we":[81,162],"propose":[82],"a":[83,100,104,132,147],"segmentation":[84,125],"system":[85,171],"predict":[88],"sequential":[92],"text":[93,124],"segments":[94],"spanning":[95],"several":[96],"segmenting":[99],"document":[101],"providing":[103],"more":[105],"balanced":[106],"representation":[107],"applications.":[110],"We":[111,145,184],"build":[112],"our":[113,169],"model":[114],"top":[116],"popular":[118],"transformer":[119],"networks":[120],"formulate":[122],"structural":[123,179],"as":[126],"change":[128],"detection,":[129],"by":[130],"performing":[131],"series":[133],"independent":[135],"classifications":[136],"allow":[138],"efficient":[140],"fine-tuning":[141],"task-specific":[143],"data.":[144],"crawl":[146],"novel":[148],"dataset":[149],"consisting":[150],"roughly":[152],"74,000":[153],"online":[154],"Terms-of-Service":[155],"documents,":[156],"including":[157],"hierarchical":[158],"topic":[159],"annotations,":[160],"use":[163],"training.":[165],"Results":[166],"show":[167],"proposed":[170],"significantly":[172],"outperforms":[173],"baselines,":[174],"adapts":[176],"well":[177],"peculiarities":[180],"documents.":[183],"release":[185],"both":[186],"data":[187],"trained":[189],"models":[190],"the":[192],"research":[193],"community":[194],"future":[196],"work.1":[197]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":8},{"year":2024,"cited_by_count":7},{"year":2023,"cited_by_count":11},{"year":2022,"cited_by_count":7}],"updated_date":"2026-04-13T07:58:08.660418","created_date":"2025-10-10T00:00:00"}
