{"id":"https://openalex.org/W7128530704","doi":"https://doi.org/10.48550/arxiv.2602.07382","title":"Advantages of Domain Knowledge Injection for Legal Document Summarization: A Case Study on Summarizing Indian Court Judgments in English and Hindi","display_name":"Advantages of Domain Knowledge Injection for Legal Document Summarization: A Case Study on Summarizing Indian Court Judgments in English and Hindi","publication_year":2026,"publication_date":"2026-02-07","ids":{"openalex":"https://openalex.org/W7128530704","doi":"https://doi.org/10.48550/arxiv.2602.07382"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.07382","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5104190342","display_name":"Debtanu Datta","orcid":"https://orcid.org/0009-0008-9568-2062"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Datta, Debtanu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125554315","display_name":"Rajdeep Mukherjee","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mukherjee, Rajdeep","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091712265","display_name":"Adrijit Goswami","orcid":"https://orcid.org/0000-0002-4420-0077"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Goswami, Adrijit","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5125559063","display_name":"Saptarshi Ghosh","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ghosh, Saptarshi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5104190342"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.8636999726295471,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.8636999726295471,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13643","display_name":"Artificial Intelligence in Law","score":0.03889999911189079,"subfield":{"id":"https://openalex.org/subfields/3320","display_name":"Political Science and International Relations"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.023499999195337296,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/hindi","display_name":"Hindi","score":0.8122000098228455},{"id":"https://openalex.org/keywords/automatic-summarization","display_name":"Automatic summarization","score":0.7778000235557556},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.529699981212616},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.4366999864578247},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.42669999599456787},{"id":"https://openalex.org/keywords/legal-document","display_name":"Legal document","score":0.3725000023841858},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.36250001192092896}],"concepts":[{"id":"https://openalex.org/C519982507","wikidata":"https://www.wikidata.org/wiki/Q1568","display_name":"Hindi","level":2,"score":0.8122000098228455},{"id":"https://openalex.org/C170858558","wikidata":"https://www.wikidata.org/wiki/Q1394144","display_name":"Automatic summarization","level":2,"score":0.7778000235557556},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6427000164985657},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6134999990463257},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5593000054359436},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.529699981212616},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.4366999864578247},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.42669999599456787},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.4043999910354614},{"id":"https://openalex.org/C2993995455","wikidata":"https://www.wikidata.org/wiki/Q3150005","display_name":"Legal document","level":2,"score":0.3725000023841858},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.36250001192092896},{"id":"https://openalex.org/C2908647359","wikidata":"https://www.wikidata.org/wiki/Q2625603","display_name":"Population","level":2,"score":0.3483999967575073},{"id":"https://openalex.org/C207685749","wikidata":"https://www.wikidata.org/wiki/Q2088941","display_name":"Domain knowledge","level":2,"score":0.3450999855995178},{"id":"https://openalex.org/C2780129039","wikidata":"https://www.wikidata.org/wiki/Q1931107","display_name":"Section (typography)","level":2,"score":0.3402999937534332},{"id":"https://openalex.org/C2778049185","wikidata":"https://www.wikidata.org/wiki/Q2334719","display_name":"Legal case","level":2,"score":0.289900004863739},{"id":"https://openalex.org/C155092808","wikidata":"https://www.wikidata.org/wiki/Q182557","display_name":"Computational linguistics","level":2,"score":0.2786000072956085},{"id":"https://openalex.org/C522695570","wikidata":"https://www.wikidata.org/wiki/Q6517578","display_name":"Legal research","level":2,"score":0.27090001106262207},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.26429998874664307},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.25360000133514404}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.07382","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.07382","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.07382","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.07382","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[{"score":0.5949631929397583,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Summarizing":[0],"Indian":[1,31,49,61,76,144],"legal":[2,21,41,62,103,111,126,145,158],"court":[3],"judgments":[4],"is":[5,43],"a":[6,26,88],"complex":[7,37],"task":[8],"not":[9,34],"only":[10],"due":[11],"to":[12,56,64,90],"the":[13,20,30,36,58,108,170],"intricate":[14],"language":[15],"and":[16,70,130,142,157],"unstructured":[17],"nature":[18],"of":[19,29,60,110,172],"texts,":[22],"but":[23],"also":[24],"since":[25],"large":[27,125],"section":[28],"population":[32],"does":[33],"understand":[35],"English":[38,69,129],"in":[39,48,67,128,139],"which":[40],"text":[42,63],"written,":[44],"thus":[45],"requiring":[46],"summaries":[47,66],"languages.":[50],"In":[51],"this":[52],"study,":[53],"we":[54,106],"aim":[55],"improve":[57],"summarization":[59,84,94],"generate":[65],"both":[68,140],"Hindi":[71],"(the":[72],"most":[73],"widely":[74],"spoken":[75],"language),":[77],"by":[78,96,150],"injecting":[79],"domain":[80,112,167],"knowledge":[81,113],"into":[82,114],"diverse":[83],"models.":[85],"We":[86],"propose":[87],"framework":[89],"enhance":[91],"extractive":[92],"neural":[93],"models":[95,116],"incorporating":[97],"domain-specific":[98,159],"pre-trained":[99],"encoders":[100],"tailored":[101],"for":[102],"texts.":[104],"Further,":[105],"explore":[107],"injection":[109],"generative":[115],"(including":[117],"Large":[118],"Language":[119],"Models)":[120],"through":[121,166],"continual":[122],"pre-training":[123],"on":[124],"corpora":[127],"Hindi.":[131],"Our":[132],"proposed":[133],"approaches":[134],"achieve":[135],"statistically":[136],"significant":[137],"improvements":[138,163],"English-to-English":[141],"English-to-Hindi":[143],"document":[146],"summarization,":[147],"as":[148],"measured":[149],"standard":[151],"evaluation":[152],"metrics,":[153,156],"factual":[154],"consistency":[155],"metrics.":[160],"Furthermore,":[161],"these":[162],"are":[164],"validated":[165],"experts,":[168],"demonstrating":[169],"effectiveness":[171],"our":[173],"approaches.":[174]},"counts_by_year":[],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2026-02-11T00:00:00"}
