{"id":"https://openalex.org/W2974201160","doi":"https://doi.org/10.1145/3342558.3345426","title":"Semi-Automatic LaTeX-Based Labeling of Mathematical Objects in PDF Documents","display_name":"Semi-Automatic LaTeX-Based Labeling of Mathematical Objects in PDF Documents","publication_year":2019,"publication_date":"2019-09-19","ids":{"openalex":"https://openalex.org/W2974201160","doi":"https://doi.org/10.1145/3342558.3345426","mag":"2974201160"},"language":"en","primary_location":{"id":"doi:10.1145/3342558.3345426","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3342558.3345426","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM Symposium on Document Engineering 2019","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5029377307","display_name":"Donald Beyette","orcid":"https://orcid.org/0000-0002-7948-7768"},"institutions":[{"id":"https://openalex.org/I91045830","display_name":"Texas A&M University","ror":"https://ror.org/01f5ytq51","country_code":"US","type":"education","lineage":["https://openalex.org/I91045830"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Donald Beyette","raw_affiliation_strings":["Computer Science and Engineering, Texas A&amp;M University, College Station, TX, USA"],"affiliations":[{"raw_affiliation_string":"Computer Science and Engineering, Texas A&amp;M University, College Station, TX, USA","institution_ids":["https://openalex.org/I91045830"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100746483","display_name":"Zelun Wang","orcid":"https://orcid.org/0000-0002-1882-2526"},"institutions":[{"id":"https://openalex.org/I91045830","display_name":"Texas A&M University","ror":"https://ror.org/01f5ytq51","country_code":"US","type":"education","lineage":["https://openalex.org/I91045830"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zelun Wang","raw_affiliation_strings":["Computer Science and Engineering, Texas A&amp;M University, College Station, TX, USA"],"affiliations":[{"raw_affiliation_string":"Computer Science and Engineering, Texas A&amp;M University, College Station, TX, USA","institution_ids":["https://openalex.org/I91045830"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002371782","display_name":"Jason Lin","orcid":"https://orcid.org/0000-0001-8013-9923"},"institutions":[{"id":"https://openalex.org/I91045830","display_name":"Texas A&M University","ror":"https://ror.org/01f5ytq51","country_code":"US","type":"education","lineage":["https://openalex.org/I91045830"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jason Lin","raw_affiliation_strings":["Computer Science and Engineering, Texas A&amp;M University, College Station, TX, USA"],"affiliations":[{"raw_affiliation_string":"Computer Science and Engineering, Texas A&amp;M University, College Station, TX, USA","institution_ids":["https://openalex.org/I91045830"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5024732465","display_name":"Jyh\u2010Charn Liu","orcid":"https://orcid.org/0000-0003-1330-5092"},"institutions":[{"id":"https://openalex.org/I91045830","display_name":"Texas A&M University","ror":"https://ror.org/01f5ytq51","country_code":"US","type":"education","lineage":["https://openalex.org/I91045830"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jyh-Charn Liu","raw_affiliation_strings":["Computer Science and Engineering, Texas A&amp;M University, College Station, TX, USA"],"affiliations":[{"raw_affiliation_string":"Computer Science and Engineering, Texas A&amp;M University, College Station, TX, USA","institution_ids":["https://openalex.org/I91045830"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5029377307"],"corresponding_institution_ids":["https://openalex.org/I91045830"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.14877242,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"4"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13523","display_name":"Mathematics, Computing, and Information Processing","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13523","display_name":"Mathematics, Computing, and Information Processing","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.9926000237464905,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9868000149726868,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/minimum-bounding-box","display_name":"Minimum bounding box","score":0.7427849769592285},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6862906217575073},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.6278887987136841},{"id":"https://openalex.org/keywords/string","display_name":"String (physics)","score":0.6185622215270996},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5665387511253357},{"id":"https://openalex.org/keywords/subject","display_name":"Subject (documents)","score":0.5477083921432495},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.5395819544792175},{"id":"https://openalex.org/keywords/ontology","display_name":"Ontology","score":0.5222597718238831},{"id":"https://openalex.org/keywords/string-searching-algorithm","display_name":"String searching algorithm","score":0.5199888348579407},{"id":"https://openalex.org/keywords/bounding-overwatch","display_name":"Bounding overwatch","score":0.4996018409729004},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.22875761985778809},{"id":"https://openalex.org/keywords/pattern-matching","display_name":"Pattern matching","score":0.18558326363563538},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.17733481526374817},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.15937384963035583},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.1574585735797882},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.1551724672317505},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.09422433376312256}],"concepts":[{"id":"https://openalex.org/C147037132","wikidata":"https://www.wikidata.org/wiki/Q6865426","display_name":"Minimum bounding box","level":3,"score":0.7427849769592285},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6862906217575073},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.6278887987136841},{"id":"https://openalex.org/C157486923","wikidata":"https://www.wikidata.org/wiki/Q1376436","display_name":"String (physics)","level":2,"score":0.6185622215270996},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5665387511253357},{"id":"https://openalex.org/C2777855551","wikidata":"https://www.wikidata.org/wiki/Q12310021","display_name":"Subject (documents)","level":2,"score":0.5477083921432495},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.5395819544792175},{"id":"https://openalex.org/C25810664","wikidata":"https://www.wikidata.org/wiki/Q44325","display_name":"Ontology","level":2,"score":0.5222597718238831},{"id":"https://openalex.org/C7757238","wikidata":"https://www.wikidata.org/wiki/Q374040","display_name":"String searching algorithm","level":3,"score":0.5199888348579407},{"id":"https://openalex.org/C63584917","wikidata":"https://www.wikidata.org/wiki/Q333286","display_name":"Bounding overwatch","level":2,"score":0.4996018409729004},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.22875761985778809},{"id":"https://openalex.org/C68859911","wikidata":"https://www.wikidata.org/wiki/Q1503724","display_name":"Pattern matching","level":2,"score":0.18558326363563538},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.17733481526374817},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.15937384963035583},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.1574585735797882},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.1551724672317505},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.09422433376312256},{"id":"https://openalex.org/C37914503","wikidata":"https://www.wikidata.org/wiki/Q156495","display_name":"Mathematical physics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3342558.3345426","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3342558.3345426","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM Symposium on Document Engineering 2019","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":6,"referenced_works":["https://openalex.org/W1975258157","https://openalex.org/W1999507153","https://openalex.org/W2563992333","https://openalex.org/W2912070268","https://openalex.org/W3003552288","https://openalex.org/W4229726356"],"related_works":["https://openalex.org/W4237171675","https://openalex.org/W3036286480","https://openalex.org/W4287027631","https://openalex.org/W3192357901","https://openalex.org/W2387360586","https://openalex.org/W2952736415","https://openalex.org/W3209723314","https://openalex.org/W3205398323","https://openalex.org/W2883297582","https://openalex.org/W4390524233"],"abstract_inverted_index":{"Mathematical":[0],"objects":[1],"(MO)":[2],"in":[3,8,15,42,76,88,150,195],"PDF":[4,43,56,77,98,114,136,144,159],"documents":[5,57,99],"is":[6,28,92,110,127,141],"paramount":[7],"understanding":[9],"the":[10,29,95,143,196],"ontology":[11],"and":[12,20,37,58,83,97,145,158],"mathematical":[13,21],"essence":[14],"published":[16],"science,":[17],"technology,":[18],"engineering,":[19],"(STEM)":[22],"documents.":[23,44],"As":[24],"of":[25,71,163,192],"now,":[26],"Marmot":[27],"only":[30],"publicly":[31],"available":[32],"data":[33,68],"set":[34,69,167],"for":[35,186],"optimizing":[36],"evaluating":[38],"MO":[39,52,72,91,133,140],"labeling":[40,51,89],"models":[41],"Thus,":[45],"this":[46],"paper":[47],"proposes":[48],"a":[49,66,101,105,122],"semiautomatic":[50],"algorithm":[53],"that":[54,171,177],"uses":[55],"their":[59,79,156,183],"corresponding":[60],"LaTeX":[61,80,96,117,132,146,157],"source":[62],"files":[63],"to":[64,93,112,129,152,168],"generate":[65],"new":[67],"consisting":[70],"bounding":[73],"boxes":[74],"(Bbox)":[75],"documents,":[78],"equation,":[81],"topic,":[82],"subject.":[84],"The":[85],"first":[86],"step":[87],"each":[90,120,131],"transform":[94],"into":[100],"string":[102],"format.":[103],"Afterwards,":[104],"shortest":[106,124],"unique":[107],"string-matching":[108,125],"technique":[109,126],"proposed":[111],"align":[113,130],"pages":[115,194],"with":[116,134],"files.":[118],"On":[119],"page,":[121],"similar":[123],"employed":[128],"its":[135],"counterpart.":[137],"Once":[138],"an":[139],"located,":[142],"MOs":[147,184],"are":[148,166,172],"normalized":[149],"order":[151],"match":[153],"symbols":[154],"between":[155],"representations.":[160],"A":[161,190],"number":[162],"filtering":[164],"rules":[165,180],"eliminate":[169],"matches":[170],"considered":[173],"exceedingly":[174],"inconsistent.":[175],"Matches":[176],"pass":[178],"these":[179],"will":[181],"have":[182],"highlighted":[185],"final":[187],"manual":[188],"inspection.":[189],"total":[191],"1,802":[193],"high":[197],"energy":[198],"physics":[199],"(hep-th)":[200],"field":[201],"were":[202],"labelled.1":[203]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
