{"id":"https://openalex.org/W2979899153","doi":"https://doi.org/10.1162/coli_a_00360","title":"Discourse in Multimedia: A Case Study in Extracting Geometry Knowledge from Textbooks","display_name":"Discourse in Multimedia: A Case Study in Extracting Geometry Knowledge from Textbooks","publication_year":2019,"publication_date":"2019-10-08","ids":{"openalex":"https://openalex.org/W2979899153","doi":"https://doi.org/10.1162/coli_a_00360","mag":"2979899153"},"language":"en","primary_location":{"id":"doi:10.1162/coli_a_00360","is_oa":true,"landing_page_url":"https://doi.org/10.1162/coli_a_00360","pdf_url":"https://www.mitpressjournals.org/doi/pdf/10.1162/coli_a_00360","source":{"id":"https://openalex.org/S155526855","display_name":"Computational Linguistics","issn_l":"0891-2017","issn":["0891-2017","1530-9312"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320244","host_organization_name":"Association for Computational Linguistics","host_organization_lineage":["https://openalex.org/P4310320244"],"host_organization_lineage_names":["Association for Computational Linguistics"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computational Linguistics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://www.mitpressjournals.org/doi/pdf/10.1162/coli_a_00360","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5002316432","display_name":"Mrinmaya Sachan","orcid":"https://orcid.org/0000-0001-8787-8681"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Mrinmaya Sachan","raw_affiliation_strings":["Carnegie Mellon University, School of Computer Science, Machine Learning Department"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University, School of Computer Science, Machine Learning Department","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047098924","display_name":"Avinava Dubey","orcid":null},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Avinava Dubey","raw_affiliation_strings":["Carnegie Mellon University, School of Computer Science, Machine Learning Department"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University, School of Computer Science, Machine Learning Department","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060225743","display_name":"Eduard Hovy","orcid":"https://orcid.org/0000-0002-3270-7903"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Eduard H. Hovy","raw_affiliation_strings":["Carnegie Mellon University, School of Computer Science, Language Technologies Institute"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University, School of Computer Science, Language Technologies Institute","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102921433","display_name":"Tom M. Mitchell","orcid":"https://orcid.org/0000-0001-7373-0301"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Tom M. Mitchell","raw_affiliation_strings":["Carnegie Mellon University, School of Computer Science, Machine Learning Department"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University, School of Computer Science, Machine Learning Department","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023802054","display_name":"Dan Roth","orcid":"https://orcid.org/0009-0002-1447-5173"},"institutions":[{"id":"https://openalex.org/I79576946","display_name":"University of Pennsylvania","ror":"https://ror.org/00b30xv10","country_code":"US","type":"education","lineage":["https://openalex.org/I79576946"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Dan Roth","raw_affiliation_strings":["University of Pennsylvania, Department of Computer and Information Science"],"affiliations":[{"raw_affiliation_string":"University of Pennsylvania, Department of Computer and Information Science","institution_ids":["https://openalex.org/I79576946"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5009547049","display_name":"Eric P. Xing","orcid":"https://orcid.org/0009-0005-9158-4201"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Eric P. Xing","raw_affiliation_strings":["Carnegie Mellon University, School of Computer Science, Machine Learning Department"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University, School of Computer Science, Machine Learning Department","institution_ids":["https://openalex.org/I74973139"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5002316432"],"corresponding_institution_ids":["https://openalex.org/I74973139"],"apc_list":null,"apc_paid":null,"fwci":1.6802,"has_fulltext":true,"cited_by_count":22,"citation_normalized_percentile":{"value":0.88506695,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":"45","issue":"4","first_page":"627","last_page":"665"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9902999997138977,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9855999946594238,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/disk-formatting","display_name":"Disk formatting","score":0.9028838276863098},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8064877986907959},{"id":"https://openalex.org/keywords/readability","display_name":"Readability","score":0.7425878047943115},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.6159242391586304},{"id":"https://openalex.org/keywords/text-linguistics","display_name":"Text linguistics","score":0.47428208589553833},{"id":"https://openalex.org/keywords/thematic-structure","display_name":"Thematic structure","score":0.4351580739021301},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.430908203125},{"id":"https://openalex.org/keywords/narrative","display_name":"Narrative","score":0.4215778708457947},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.42048782110214233},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3938031792640686}],"concepts":[{"id":"https://openalex.org/C88006597","wikidata":"https://www.wikidata.org/wiki/Q690117","display_name":"Disk formatting","level":2,"score":0.9028838276863098},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8064877986907959},{"id":"https://openalex.org/C2778143727","wikidata":"https://www.wikidata.org/wiki/Q1820650","display_name":"Readability","level":2,"score":0.7425878047943115},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.6159242391586304},{"id":"https://openalex.org/C64417998","wikidata":"https://www.wikidata.org/wiki/Q1206895","display_name":"Text linguistics","level":2,"score":0.47428208589553833},{"id":"https://openalex.org/C2778109090","wikidata":"https://www.wikidata.org/wiki/Q7781195","display_name":"Thematic structure","level":2,"score":0.4351580739021301},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.430908203125},{"id":"https://openalex.org/C199033989","wikidata":"https://www.wikidata.org/wiki/Q1318295","display_name":"Narrative","level":2,"score":0.4215778708457947},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.42048782110214233},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3938031792640686},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1162/coli_a_00360","is_oa":true,"landing_page_url":"https://doi.org/10.1162/coli_a_00360","pdf_url":"https://www.mitpressjournals.org/doi/pdf/10.1162/coli_a_00360","source":{"id":"https://openalex.org/S155526855","display_name":"Computational Linguistics","issn_l":"0891-2017","issn":["0891-2017","1530-9312"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320244","host_organization_name":"Association for Computational Linguistics","host_organization_lineage":["https://openalex.org/P4310320244"],"host_organization_lineage_names":["Association for Computational Linguistics"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computational Linguistics","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:dc8f38f4640e4e158191ebcbb5855a15","is_oa":true,"landing_page_url":"https://doaj.org/article/dc8f38f4640e4e158191ebcbb5855a15","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Computational Linguistics, Vol 45, Iss 4, Pp 627-665 (2020)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1162/coli_a_00360","is_oa":true,"landing_page_url":"https://doi.org/10.1162/coli_a_00360","pdf_url":"https://www.mitpressjournals.org/doi/pdf/10.1162/coli_a_00360","source":{"id":"https://openalex.org/S155526855","display_name":"Computational Linguistics","issn_l":"0891-2017","issn":["0891-2017","1530-9312"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320244","host_organization_name":"Association for Computational Linguistics","host_organization_lineage":["https://openalex.org/P4310320244"],"host_organization_lineage_names":["Association for Computational Linguistics"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computational Linguistics","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.8799999952316284,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2979899153.pdf","grobid_xml":"https://content.openalex.org/works/W2979899153.grobid-xml"},"referenced_works_count":133,"referenced_works":["https://openalex.org/W41611457","https://openalex.org/W55989445","https://openalex.org/W64910274","https://openalex.org/W71631801","https://openalex.org/W120297271","https://openalex.org/W263614502","https://openalex.org/W357519574","https://openalex.org/W767947605","https://openalex.org/W890580221","https://openalex.org/W998330076","https://openalex.org/W1493490255","https://openalex.org/W1496737558","https://openalex.org/W1498682480","https://openalex.org/W1504725289","https://openalex.org/W1505520120","https://openalex.org/W1509595041","https://openalex.org/W1539633941","https://openalex.org/W1544505229","https://openalex.org/W1545396636","https://openalex.org/W1548163180","https://openalex.org/W1563792215","https://openalex.org/W1594973830","https://openalex.org/W1597655096","https://openalex.org/W1599381846","https://openalex.org/W1602510369","https://openalex.org/W1606427739","https://openalex.org/W1628475528","https://openalex.org/W1633301614","https://openalex.org/W1637480429","https://openalex.org/W1659846831","https://openalex.org/W1920406848","https://openalex.org/W1972398108","https://openalex.org/W1978081087","https://openalex.org/W1981791873","https://openalex.org/W1990100773","https://openalex.org/W2010353619","https://openalex.org/W2015812272","https://openalex.org/W2034183571","https://openalex.org/W2045738181","https://openalex.org/W2049931505","https://openalex.org/W2053860863","https://openalex.org/W2056531976","https://openalex.org/W2057277029","https://openalex.org/W2060565333","https://openalex.org/W2069684104","https://openalex.org/W2070789508","https://openalex.org/W2077378514","https://openalex.org/W2083330748","https://openalex.org/W2085574295","https://openalex.org/W2097898123","https://openalex.org/W2100023842","https://openalex.org/W2102506621","https://openalex.org/W2107618763","https://openalex.org/W2114114835","https://openalex.org/W2115007594","https://openalex.org/W2118781169","https://openalex.org/W2119807359","https://openalex.org/W2120136138","https://openalex.org/W2120691627","https://openalex.org/W2121406004","https://openalex.org/W2123442489","https://openalex.org/W2127635582","https://openalex.org/W2127978399","https://openalex.org/W2129804798","https://openalex.org/W2132881639","https://openalex.org/W2134150392","https://openalex.org/W2135336649","https://openalex.org/W2147258359","https://openalex.org/W2147880316","https://openalex.org/W2148404145","https://openalex.org/W2149367074","https://openalex.org/W2151115083","https://openalex.org/W2154407881","https://openalex.org/W2154652894","https://openalex.org/W2156021548","https://openalex.org/W2158211888","https://openalex.org/W2158396456","https://openalex.org/W2158570207","https://openalex.org/W2161002933","https://openalex.org/W2163274265","https://openalex.org/W2167702024","https://openalex.org/W2168065722","https://openalex.org/W2170732969","https://openalex.org/W2173426956","https://openalex.org/W2179053401","https://openalex.org/W2241862190","https://openalex.org/W2250249423","https://openalex.org/W2250362537","https://openalex.org/W2250424758","https://openalex.org/W2250432970","https://openalex.org/W2250564385","https://openalex.org/W2251199281","https://openalex.org/W2251249019","https://openalex.org/W2251293245","https://openalex.org/W2251355301","https://openalex.org/W2252136820","https://openalex.org/W2252267789","https://openalex.org/W2304240348","https://openalex.org/W2307512708","https://openalex.org/W2343487696","https://openalex.org/W2502443097","https://openalex.org/W2514190896","https://openalex.org/W2520300089","https://openalex.org/W2532161561","https://openalex.org/W2553246593","https://openalex.org/W2559655401","https://openalex.org/W2594782638","https://openalex.org/W2608651664","https://openalex.org/W2613000335","https://openalex.org/W2615071493","https://openalex.org/W2746097825","https://openalex.org/W2911267749","https://openalex.org/W2918008835","https://openalex.org/W2930957955","https://openalex.org/W2941620504","https://openalex.org/W2951278025","https://openalex.org/W2951719623","https://openalex.org/W2962800603","https://openalex.org/W2963617989","https://openalex.org/W3037679343","https://openalex.org/W3104376605","https://openalex.org/W3126976873","https://openalex.org/W3143504415","https://openalex.org/W3147653952","https://openalex.org/W3158633990","https://openalex.org/W4231741839","https://openalex.org/W4242912959","https://openalex.org/W4249550410","https://openalex.org/W4254611763","https://openalex.org/W4285719527","https://openalex.org/W4298382214","https://openalex.org/W4381925011","https://openalex.org/W4402715029"],"related_works":["https://openalex.org/W4223983815","https://openalex.org/W2895083663","https://openalex.org/W3040659826","https://openalex.org/W3185130901","https://openalex.org/W2610081246","https://openalex.org/W4312674007","https://openalex.org/W2368099769","https://openalex.org/W2036710212","https://openalex.org/W2347764438","https://openalex.org/W3217362626"],"abstract_inverted_index":{"To":[0],"ensure":[1],"readability,":[2],"text":[3,13,65,90,123],"is":[4,129],"often":[5],"written":[6],"and":[7,39,91,122],"presented":[8],"with":[9],"due":[10],"formatting.":[11],"These":[12],"formatting":[14,68],"devices":[15],"help":[16,29],"the":[17,22,25,30,34,37,41,98,120,139],"writer":[18],"to":[19,108,131,146],"effectively":[20],"convey":[21],"narrative.":[23],"At":[24],"same":[26],"time,":[27],"these":[28,58,85,106],"readers":[31],"pick":[32],"up":[33],"structure":[35,54],"of":[36,49,55,84,113],"discourse":[38,53,86,121],"comprehend":[40],"conveyed":[42],"information.":[43,134],"There":[44],"have":[45],"been":[46],"a":[47,101],"number":[48],"linguistic":[50],"theories":[51,59],"on":[52],"text.":[56,63],"However,":[57],"only":[60],"consider":[61],"unformatted":[62],"Multimedia":[64],"contains":[66],"rich":[67],"features":[69,87,107,125],"that":[70,119,128,138],"can":[71,143],"be":[72,144],"leveraged":[73],"for":[74,151],"various":[75],"NLP":[76],"tasks.":[77],"In":[78],"this":[79],"article,":[80],"we":[81,104,136],"study":[82],"some":[83],"in":[88,97],"multimedia":[89],"what":[92],"communicative":[93],"function":[94],"they":[95],"fulfill":[96],"context.":[99],"As":[100],"case":[102],"study,":[103],"use":[105],"harvest":[109],"structured":[110,141],"subject":[111],"knowledge":[112,142],"geometry":[114,152],"from":[115],"textbooks.":[116],"We":[117],"conclude":[118],"layout":[124],"provide":[126],"information":[127],"complementary":[130],"lexical":[132],"semantic":[133],"Finally,":[135],"show":[137],"harvested":[140],"used":[145],"improve":[147],"an":[148],"existing":[149],"solver":[150],"problems,":[153],"making":[154],"it":[155],"more":[156,161],"accurate":[157],"as":[158,160],"well":[159],"explainable.":[162]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":5},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
