{"id":"https://openalex.org/W2045178782","doi":"https://doi.org/10.1162/coli_r_00102","title":"<b>The Structure of Scientific Articles: Applications to Citation Indexing and Summarization Simone Teufel</b> (University of Cambridge) Stanford, CA: CSLI Publications (CSLI Studies in Computational Linguistics), 2010, xii+518 pp; hardbound, ISBN 978-1-57586-555-3, $70.00; paperbound, ISBN 978-1-57586-556-0, $32.50","display_name":"<b>The Structure of Scientific Articles: Applications to Citation Indexing and Summarization Simone Teufel</b> (University of Cambridge) Stanford, CA: CSLI Publications (CSLI Studies in Computational Linguistics), 2010, xii+518 pp; hardbound, ISBN 978-1-57586-555-3, $70.00; paperbound, ISBN 978-1-57586-556-0, $32.50","publication_year":2012,"publication_date":"2012-02-13","ids":{"openalex":"https://openalex.org/W2045178782","doi":"https://doi.org/10.1162/coli_r_00102","mag":"2045178782"},"language":"en","primary_location":{"id":"doi:10.1162/coli_r_00102","is_oa":true,"landing_page_url":"https://doi.org/10.1162/coli_r_00102","pdf_url":"https://www.mitpressjournals.org/doi/pdf/10.1162/COLI_r_00102","source":{"id":"https://openalex.org/S155526855","display_name":"Computational Linguistics","issn_l":"0891-2017","issn":["0891-2017","1530-9312"],"is_oa":false,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320244","host_organization_name":"Association for Computational Linguistics","host_organization_lineage":["https://openalex.org/P4310320244"],"host_organization_lineage_names":["Association for Computational Linguistics"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computational Linguistics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://www.mitpressjournals.org/doi/pdf/10.1162/COLI_r_00102","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5056001196","display_name":"Robert E. Mercer","orcid":"https://orcid.org/0000-0002-0080-715X"},"institutions":[{"id":"https://openalex.org/I101343708","display_name":"Mercer (Czechia)","ror":"https://ror.org/04c6pgy84","country_code":"CZ","type":"company","lineage":["https://openalex.org/I101343708"]}],"countries":["CZ"],"is_corresponding":true,"raw_author_name":"Robert E. Mercer","raw_affiliation_strings":["Robert E. Mercer is a Professor of Computer Science at the University of Western Ontario. His research interests include argumentation in science writing and annotation. Mercer's e-mail address is "],"affiliations":[{"raw_affiliation_string":"Robert E. Mercer is a Professor of Computer Science at the University of Western Ontario. His research interests include argumentation in science writing and annotation. Mercer's e-mail address is ","institution_ids":["https://openalex.org/I101343708"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5056001196"],"corresponding_institution_ids":["https://openalex.org/I101343708"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.09938832,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"38","issue":"2","first_page":"443","last_page":"445"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9210000038146973,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9210000038146973,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/automatic-summarization","display_name":"Automatic summarization","score":0.9039143323898315},{"id":"https://openalex.org/keywords/citation","display_name":"Citation","score":0.6261339783668518},{"id":"https://openalex.org/keywords/search-engine-indexing","display_name":"Search engine indexing","score":0.5955591797828674},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4506932199001312},{"id":"https://openalex.org/keywords/library-science","display_name":"Library science","score":0.44212672114372253},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.37143585085868835},{"id":"https://openalex.org/keywords/cognitive-science","display_name":"Cognitive science","score":0.34273093938827515},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.2569783926010132}],"concepts":[{"id":"https://openalex.org/C170858558","wikidata":"https://www.wikidata.org/wiki/Q1394144","display_name":"Automatic summarization","level":2,"score":0.9039143323898315},{"id":"https://openalex.org/C2778805511","wikidata":"https://www.wikidata.org/wiki/Q1713","display_name":"Citation","level":2,"score":0.6261339783668518},{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.5955591797828674},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4506932199001312},{"id":"https://openalex.org/C161191863","wikidata":"https://www.wikidata.org/wiki/Q199655","display_name":"Library science","level":1,"score":0.44212672114372253},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.37143585085868835},{"id":"https://openalex.org/C188147891","wikidata":"https://www.wikidata.org/wiki/Q147638","display_name":"Cognitive science","level":1,"score":0.34273093938827515},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.2569783926010132}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1162/coli_r_00102","is_oa":true,"landing_page_url":"https://doi.org/10.1162/coli_r_00102","pdf_url":"https://www.mitpressjournals.org/doi/pdf/10.1162/COLI_r_00102","source":{"id":"https://openalex.org/S155526855","display_name":"Computational Linguistics","issn_l":"0891-2017","issn":["0891-2017","1530-9312"],"is_oa":false,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320244","host_organization_name":"Association for Computational Linguistics","host_organization_lineage":["https://openalex.org/P4310320244"],"host_organization_lineage_names":["Association for Computational Linguistics"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computational Linguistics","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:17ad1c3f517a4bc899d40a9afcf537f3","is_oa":true,"landing_page_url":"https://doaj.org/article/17ad1c3f517a4bc899d40a9afcf537f3","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Computational Linguistics, Vol 38, Iss 2 (2021)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1162/coli_r_00102","is_oa":true,"landing_page_url":"https://doi.org/10.1162/coli_r_00102","pdf_url":"https://www.mitpressjournals.org/doi/pdf/10.1162/COLI_r_00102","source":{"id":"https://openalex.org/S155526855","display_name":"Computational Linguistics","issn_l":"0891-2017","issn":["0891-2017","1530-9312"],"is_oa":false,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320244","host_organization_name":"Association for Computational Linguistics","host_organization_lineage":["https://openalex.org/P4310320244"],"host_organization_lineage_names":["Association for Computational Linguistics"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computational Linguistics","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.800000011920929,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2045178782.pdf","grobid_xml":"https://content.openalex.org/works/W2045178782.grobid-xml"},"referenced_works_count":2,"referenced_works":["https://openalex.org/W205532704","https://openalex.org/W2250389127"],"related_works":["https://openalex.org/W2366403280","https://openalex.org/W1495108544","https://openalex.org/W3148229873","https://openalex.org/W4242223894","https://openalex.org/W2091301346","https://openalex.org/W2150160875","https://openalex.org/W1517524280","https://openalex.org/W4306886878","https://openalex.org/W2188505374","https://openalex.org/W1558342070"],"abstract_inverted_index":{"Discourse":[0,432],"models":[1,30,121,442,710],"have":[2,356],"received":[3],"significant":[4],"attention":[5],"in":[6,60,380,409,445,543,638,810,931,942,974,991,1088,1103,1139],"the":[7,16,22,148,161,169,176,188,191,194,217,235,260,263,267,284,327,331,372,381,385,399,407,410,429,439,462,511,530,549,558,561,567,579,585,593,598,604,612,620,627,648,653,659,662,665,674,680,689,697,700,708,713,737,743,751,754,763,770,784,788,793,811,815,821,863,866,871,875,886,912,915,919,932,943,976,982,996,1005,1015,1035,1045,1048,1053,1057,1064,1067,1075,1079,1084,1100,1104,1124,1150,1155],"computational":[8,387,400,613,739,764,1011],"linguistics":[9,401,614,740,765,1012],"community":[10],"with":[11,32,88,129,276,361,658],"some":[12,804,1042,1051,1118],"important":[13,58,463,681,938,953,971],"connections":[14],"to":[15,40,106,144,159,175,230,242,343,453,468,699,706,786,800,885,901,957,972,1073,1135,1141,1154],"non-computational":[17],"discourse":[18,25,63,109,120,220,328,441,933,946,993,1016,1058,1080],"community.":[19],"More":[20],"recently,":[21],"importance":[23],"of":[24,53,77,91,147,168,193,223,237,266,283,287,297,304,326,371,406,428,447,465,529,560,578,581,592,597,630,647,651,683,729,753,772,817,820,844,852,874,896,911,925,945,955,1004,1010,1030,1038,1047,1052,1066,1078,1086,1149],"annotation":[26,48,65,507,537,562,691,799,920,1126],"has":[27,214,483],"increased":[28],"as":[29,114,163,172,179,183,319,569,848,850,882],"generated":[31],"supervised":[33,702],"machine":[34,628],"learning":[35],"techniques":[36],"are":[37,150,317,337,351,378,412,443,532,541,636,686,1060],"being":[38,333,455],"used":[39,379,601,606,611,625,687,705],"annotate":[41],"text":[42,78,375,654],"automatically.":[43],"A":[44,575],"primary":[45],"area":[46,178],"for":[47,166,190,262,418,572,826,917,995,1002],"is":[49,56,70,99,127,234,421,473,480,491,736,746,970,989,1007,1019,1032,1107],"science.":[50],"The":[51,97,196,205,394,525,536,733,756],"theme":[52,265],"Teufel\u2019s":[54,83,108,415,1097],"book":[55,69,98,149,162,411,935,1006],"an":[57,173,281,295,425,796,883,902,937,952],"contribution":[59],"these":[61,730],"areas:":[62],"models,":[64],"schemes,":[66],"and":[67,79,94,101,122,133,203,225,233,251,254,292,313,346,392,494,521,527,556,617,633,664,717,724,726,742,778,792,842,922,928,939,948,950,1024,1034],"applications.The":[68],"a":[71,89,115,134,164,180,184,238,368,456,500,570,589,644,856,894,909,923,992,1008,1143],"substantial":[72],"work,":[73],"approximately":[74],"450":[75],"pages":[76],"appendices.":[80],"It":[81,472],"extends":[82],"Ph.D.":[84],"thesis":[85],"(Teufel":[86],"2000)":[87],"decade":[90],"new":[92,131,309,449],"work":[93,956],"updated":[95],"references.":[96],"content-rich":[100],"meticulously":[102],"written.":[103],"In":[104,451,865],"addition":[105,452],"presenting":[107],"model,":[110],"it":[111,454,482,490,869,969],"also":[112,879],"works":[113],"good":[116,576],"entry":[117],"point":[118],"into":[119,855],"annotation.":[123],"Because":[124],"each":[125,136,167],"chapter":[126,137,395,768],"structured":[128],"background,":[130],"material,":[132],"summary,":[135],"can":[138,273,340,961],"be":[139,274,341,624,1092,1136],"read":[140],"somewhat":[141],"independently.":[142],"Cross-references":[143],"other":[145,605,959],"parts":[146],"carefully":[151,533],"included":[152],"where":[153],"warranted.":[154],"This":[155,767,877,1027],"structure":[156,1039],"lends":[157],"itself":[158,657],"using":[160,564],"reference":[165],"subtopics":[170],"or":[171,363,963],"introduction":[174,884],"subject":[177],"whole,":[181],"suitable":[182],"textbook.Chapter":[185],"1":[186],"sets":[187,198],"stage":[189],"rest":[192],"book.":[195,876,1049],"author":[197,663],"out":[199,461],"her":[200,448,1000],"fundamental":[201,206,1054],"assumptions":[202,207],"hypotheses.":[204],"arise":[208],"from":[209,795],"three":[210,506,602],"observations":[211],"that":[212,279,316,329,339,355,377,552,622,635,655,678,685,711,835,898,987,1123],"she":[213,459,988],"made":[215],"regarding":[216,1056],"literature.":[218],"Scientific":[219],"contains":[221,228,330,424],"descriptions":[222],"positive":[224],"negative":[226],"states,":[227],"references":[229],"others\u2019":[231],"contributions,":[232],"result":[236],"rhetorical":[239,285,311,362,747,1025],"game":[240],"intended":[241],"promote":[243],"one\u2019s":[244],"contribution.":[245],"Chapter":[246,255,300,639,641,671,693,720,860],"2,":[247],"on":[248,257,398,403,510,548,762,1021],"information":[249,320,332],"retrieval":[250],"citation":[252,314,353,358],"indexes,":[253],"3,":[256],"summarization,":[258],"provide":[259],"motivation":[261],"main":[264,872],"book:":[268,386,983],"These":[269],"two":[270,308,1068],"information-based":[271],"endeavors":[272],"enhanced":[275,323],"automated":[277],"tools":[278,825],"incorporate":[280],"understanding":[282],"aspects":[286,464,682],"science":[288,419,1033,1089],"writing.Whereas":[289],"Chapters":[290],"2":[291,892],"3":[293],"give":[294],"overview":[296],"current":[298],"methodologies,":[299],"4,":[301],"\u201cNew":[302],"Types":[303],"Information":[305],"Access,\u201d":[306],"introduces":[307,696],"techniques,":[310],"extracts":[312,336],"maps,":[315],"suggested":[318],"navigation":[321,347],"methods":[322,841],"by":[324,588,626,688,1063,1096,1131],"knowledge":[325,479,1022],"accessed.":[334],"Rhetorical":[335,469],"snippets":[338],"tailored":[342],"user":[344],"expertise":[345],"task.":[348],"Citation":[349,517],"maps":[350],"interactive":[352],"indexes":[354],"their":[357,965],"links":[359],"augmented":[360],"sentiment":[364],"information.Chapter":[365],"5":[366],"gives":[367,436],"detailed":[369,590],"description":[370,427],"five":[373],"scientific":[374,827,832,846],"corpora":[376],"research":[382,808],"described":[383,637],"throughout":[384],"linguistics,":[388],"chemistry,":[389,773],"genetics,":[390],"cardiology,":[391],"agriculture.":[393],"focuses":[396],"primarily":[397],"corpus,":[402],"which":[404,802,958],"most":[405],"results":[408,759],"based.":[413],"SciXML,":[414,918],"markup":[416],"language":[417],"articles,":[420,914],"described.Chapter":[422],"6":[423],"in-depth":[426],"Knowledge":[430,513],"Claim":[431,514],"Model":[433],"(KCDM).":[434],"Teufel":[435,985],"reasons":[437],"why":[438],"traditional":[440],"abandoned":[444],"favor":[446],"model.":[450,1081],"shallow":[457],"method,":[458],"points":[460,979],"KCDM":[466,790,822],"(compared":[467],"Structure":[470],"Theory):":[471],"text-type-specific":[474],"(scientific":[475],"articles);":[476],"no":[477],"world":[478],"required;":[481],"global":[484],"(top-down)":[485],"not":[486,498],"local":[487],"(bottom-up)":[488],"relations;":[489],"non-hierarchical":[492],"(citation":[493],"summarization":[495],"applications":[496],"do":[497],"require":[499],"rich":[501],"hierarchical":[502],"structure).Chapter":[503],"7":[504],"presents":[505,722],"schemes":[508,531],"based":[509,761,1020],"KCDM:":[512],"Attribution":[515],"(KCA),":[516],"Function":[518],"Classification":[519],"(CFC),":[520],"Argumentative":[522],"Zoning":[523],"(AZ).":[524],"background":[526],"purpose":[528],"laid":[534],"out.":[535],"guidelines":[538],"(coding":[539],"manuals)":[540],"given":[542,1044],"Appendix":[544],"C.Chapter":[545],"8":[546],"reports":[547],"reliability":[550],"studies":[551,600,610],"use":[553],"human":[554],"annotators":[555,568],"gauge":[557],"quality":[559],"scheme":[563],"agreement":[565,583],"among":[566],"proxy":[571],"this":[573],"measure.":[574],"discussion":[577,646],"measures":[580],"annotator":[582],"opens":[584],"chapter,":[586],"followed":[587],"analysis":[591],"four":[594,599,906],"studies.":[595],"Three":[596],"annotators,":[603],"18":[607],"annotators.":[608,719],"All":[609],"corpus.Chapters":[615],"9":[616,642],"10":[618,672],"discuss":[619],"features":[621,677],"will":[623],"implementations":[629],"AZ,":[631,715],"KCA,":[632,716],"CFC":[634,718],"11.":[640],"provides":[643,862,951],"comprehensive":[645],"various":[649],"embodiments":[650],"meta-discourse,":[652],"concerns":[656],"dialogue":[660],"between":[661],"reader":[666,698],"rather":[667],"than":[668,1094,1110],"content-bearing":[669],"text.":[670],"discusses":[673],"computable":[675],"surface":[676],"capture":[679],"meta-discourse":[684],"automatic":[690,714,731,829,853,904,1151],"methods.":[692,732],"11":[694],"then":[695],"standard":[701,735],"machine-learning":[703],"methodology":[704],"generate":[707],"statistical":[709],"implement":[712],"12":[721],"gold-standard,":[723],"extrinsic":[725,744],"subjective":[727],"evaluations":[728],"gold":[734,1146],"human-annotated":[738],"articles":[741],"task":[745],"extracts.Chapter":[748],"13":[749],"investigates":[750],"universality":[752],"KCDM.":[755],"earlier":[757],"chapters\u2019":[758],"were":[760],"corpus.":[766],"considers":[769],"disciplines":[771],"computer":[774],"science,":[775],"biology,":[776],"astrophysics,":[777],"legal":[779],"texts.":[780],"Two":[781],"issues":[782],"surface:":[783],"need":[785,1134],"modify":[787],"original":[789],"slightly,":[791],"move":[794],"absolutely":[797],"domain-knowledge-free":[798,1125],"one":[801,1072],"includes":[803],"high-level":[805],"facts":[806],"about":[807],"practices":[809],"discipline.Chapter":[812],"14":[813],"pushes":[814],"frontiers":[816],"potential":[818],"uses":[819],"methodology:":[823],"support":[824],"writing,":[828],"review":[830],"generation,":[831],"summary":[833],"generation":[834],"moves":[836],"beyond":[837],"simple":[838],"sentence":[839],"extraction":[840],"summaries":[843],"multiple":[845],"documents,":[847],"well":[849],"integration":[851],"AZ":[854],"large-scale":[857],"digital":[858],"library.":[859],"15":[861],"conclusion.":[864],"first":[867],"section":[868,878],"recapitulates":[870],"themes":[873],"nicely":[880],"serves":[881],"book,":[887],"if":[888],"so":[889],"desired.":[890],"Section":[891],"lists":[893],"number":[895],"areas":[897],"could":[899],"lead":[900],"improved":[903],"system.The":[905],"appendices":[907],"contain":[908],"list":[910],"CmpLG-D":[913],"DTD":[916],"guidelines,":[921],"catalog":[924],"lexical":[926],"items":[927],"patterns":[929],"useful":[930],"setting.The":[934],"makes":[936],"powerful":[940],"statement":[941],"field":[944],"modeling":[947],"annotation,":[949],"body":[954],"researchers":[960,1119],"add":[962],"compare":[964],"work.":[966],"I":[967],"think":[968],"keep":[973],"mind":[975],"following":[977],"few":[978],"while":[980],"reading":[981],"First,":[984],"comments":[986],"interested":[990],"model":[994,1017,1059],"experimental":[997],"sciences,":[998],"yet":[999],"focus":[1001],"much":[1003],"corpus":[1009],"papers.":[1013],"Also,":[1014],"proposed":[1018],"claims":[1023],"moves.":[1026],"catholic":[1028],"view":[1029,1037],"what":[1031],"narrow":[1036],"may":[1040,1091,1133],"surprise":[1041],"readers":[1043],"title":[1046],"Next,":[1050],"decisions":[1055],"heavily":[1061],"influenced":[1062],"requirements":[1065],"motivational":[1069],"topics,":[1070],"leading":[1071],"question":[1074],"full":[1076],"generality":[1077],"As":[1082],"well,":[1083],"range":[1085],"rhetoric":[1087],"writing":[1090],"broader":[1093],"anticipated":[1095],"model\u2014for":[1098],"example,":[1099],"style":[1101],"found":[1102],"geology":[1105],"discipline":[1106],"more":[1108,1144],"cumulative":[1109],"critical":[1111],"(Heather":[1112],"Graves,":[1113],"personal":[1114],"communication).":[1115],"And":[1116],"finally,":[1117],"(White":[1120],"2010)":[1121],"argue":[1122],"dictum,":[1127],"although":[1128],"loosened":[1129],"slightly":[1130],"Teufel,":[1132],"further":[1137],"relaxed":[1138],"order":[1140],"produce":[1142],"accurate":[1145],"standard,":[1147],"regardless":[1148],"system\u2019s":[1152],"access":[1153],"same":[1156],"domain":[1157],"knowledge.":[1158]},"counts_by_year":[{"year":2016,"cited_by_count":1}],"updated_date":"2026-02-24T19:35:01.260952","created_date":"2016-06-24T00:00:00"}
