{"id":"https://openalex.org/W3022563068","doi":"https://doi.org/10.1145/3371300.3383351","title":"Towards generating web-accessible STEM documents from PDF","display_name":"Towards generating web-accessible STEM documents from PDF","publication_year":2020,"publication_date":"2020-04-20","ids":{"openalex":"https://openalex.org/W3022563068","doi":"https://doi.org/10.1145/3371300.3383351","mag":"3022563068"},"language":"en","primary_location":{"id":"doi:10.1145/3371300.3383351","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3371300.3383351","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 17th International Web for All Conference","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5043436240","display_name":"Volker Sorge","orcid":"https://orcid.org/0000-0003-2796-1488"},"institutions":[{"id":"https://openalex.org/I79619799","display_name":"University of Birmingham","ror":"https://ror.org/03angcq70","country_code":"GB","type":"education","lineage":["https://openalex.org/I79619799"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Volker Sorge","raw_affiliation_strings":["University of Birmingham, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Birmingham, UK","institution_ids":["https://openalex.org/I79619799"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066310804","display_name":"Akashdeep Bansal","orcid":null},"institutions":[{"id":"https://openalex.org/I68891433","display_name":"Indian Institute of Technology Delhi","ror":"https://ror.org/049tgcd06","country_code":"IN","type":"education","lineage":["https://openalex.org/I68891433"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Akashdeep Bansal","raw_affiliation_strings":["IIT Delhi"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"IIT Delhi","institution_ids":["https://openalex.org/I68891433"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038747880","display_name":"Neha Jadhav","orcid":"https://orcid.org/0009-0005-5464-3559"},"institutions":[{"id":"https://openalex.org/I68891433","display_name":"Indian Institute of Technology Delhi","ror":"https://ror.org/049tgcd06","country_code":"IN","type":"education","lineage":["https://openalex.org/I68891433"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Neha M Jadhav","raw_affiliation_strings":["IIT Delhi"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"IIT Delhi","institution_ids":["https://openalex.org/I68891433"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020917402","display_name":"Himanshu Garg","orcid":null},"institutions":[{"id":"https://openalex.org/I68891433","display_name":"Indian Institute of Technology Delhi","ror":"https://ror.org/049tgcd06","country_code":"IN","type":"education","lineage":["https://openalex.org/I68891433"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Himanshu Garg","raw_affiliation_strings":["IIT Delhi"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"IIT Delhi","institution_ids":["https://openalex.org/I68891433"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5104075576","display_name":"Ayushi Verma","orcid":"https://orcid.org/0000-0003-1160-1357"},"institutions":[{"id":"https://openalex.org/I68891433","display_name":"Indian Institute of Technology Delhi","ror":"https://ror.org/049tgcd06","country_code":"IN","type":"education","lineage":["https://openalex.org/I68891433"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Ayushi Verma","raw_affiliation_strings":["IIT Delhi"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"IIT Delhi","institution_ids":["https://openalex.org/I68891433"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5102857440","display_name":"S. Balakrishnan","orcid":"https://orcid.org/0009-0000-2568-0151"},"institutions":[{"id":"https://openalex.org/I68891433","display_name":"Indian Institute of Technology Delhi","ror":"https://ror.org/049tgcd06","country_code":"IN","type":"education","lineage":["https://openalex.org/I68891433"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"M Balakrishnan","raw_affiliation_strings":["IIT Delhi"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"IIT Delhi","institution_ids":["https://openalex.org/I68891433"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.1655,"has_fulltext":false,"cited_by_count":10,"citation_normalized_percentile":{"value":0.83260044,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13523","display_name":"Mathematics, Computing, and Information Processing","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13523","display_name":"Mathematics, Computing, and Information Processing","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12171","display_name":"Open Education and E-Learning","score":0.9890999794006348,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9763000011444092,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8236664533615112},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.6071441769599915},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5960793495178223},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5479968190193176},{"id":"https://openalex.org/keywords/file-format","display_name":"File format","score":0.5060777068138123},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.3473961353302002},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.23672452569007874}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8236664533615112},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.6071441769599915},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5960793495178223},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5479968190193176},{"id":"https://openalex.org/C97250363","wikidata":"https://www.wikidata.org/wiki/Q235557","display_name":"File format","level":2,"score":0.5060777068138123},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.3473961353302002},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.23672452569007874},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3371300.3383351","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3371300.3383351","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 17th International Web for All Conference","raw_type":"proceedings-article"},{"id":"pmh:oai:pure.atira.dk:openaire_cris_publications/625b82c9-19ce-4d6c-bd17-70cc691e3d76","is_oa":false,"landing_page_url":"https://research.birmingham.ac.uk/en/publications/625b82c9-19ce-4d6c-bd17-70cc691e3d76","pdf_url":null,"source":{"id":"https://openalex.org/S4306402634","display_name":"University of Birmingham Research Portal (University of Birmingham)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I79619799","host_organization_name":"University of Birmingham","host_organization_lineage":["https://openalex.org/I79619799"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Sorge, V, Bansal, A, Jadhav, N M, Garg, H, Verma, A & Balakrishnan, M 2020, Towards generating web-accessible STEM documents from PDF. in Proceedings of the 17th International Web for All Conference, W4A 2020. Proceedings of the 17th International Web for All Conference, W4A 2020, Association for Computing Machinery , 17th International Web for All Conference, W4A 2020, Taipei, Taiwan, Province of China, 20/04/20. https://doi.org/10.1145/3371300.3383351","raw_type":"contributionToPeriodical"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":6,"referenced_works":["https://openalex.org/W69001340","https://openalex.org/W139731185","https://openalex.org/W2144209937","https://openalex.org/W2346371394","https://openalex.org/W2501572931","https://openalex.org/W2896060357"],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W2357241418","https://openalex.org/W2086064646","https://openalex.org/W2119135658","https://openalex.org/W2115485936","https://openalex.org/W3022131925","https://openalex.org/W2349174110","https://openalex.org/W1597238586","https://openalex.org/W1536405386","https://openalex.org/W2326857978"],"abstract_inverted_index":{"PDF":[0,28,55,79],"is":[1,8,44],"still":[2,32],"a":[3,72],"very":[4],"popular":[5],"format":[6,56],"that":[7],"widely":[9],"used":[10],"to":[11,24,77,113],"exchange":[12],"and":[13,58,96,109],"archive":[14],"electronic":[15],"documents.":[16],"And":[17],"although":[18],"considerable":[19],"efforts":[20],"have":[21],"been":[22],"made":[23],"ensure":[25],"accessibility":[26],"of":[27,102],"documents,":[29],"they":[30],"are":[31,52,59],"far":[33],"from":[34],"ideal":[35],"when":[36],"complex":[37],"content":[38],"like":[39],"formulas,":[40],"diagrams":[41],"or":[42],"tables":[43,97],"present.":[45],"Unfortunately,":[46],"many":[47],"publications":[48],"in":[49,54,106,116],"scientific":[50],"subjects":[51],"available":[53],"only":[57,64],"therefore,":[60],"if":[61],"at":[62],"all,":[63],"partially":[65],"accessible.":[66],"In":[67],"this":[68,107],"paper,":[69],"we":[70,111],"present":[71],"fully":[73],"automated":[74],"web-based":[75],"technology":[76],"convert":[78],"documents":[80],"into":[81],"an":[82],"accessible":[83],"single":[84],"file":[85],"format.":[86],"We":[87],"concentrate":[88],"on":[89],"presenting":[90],"working":[91],"solutions":[92],"for":[93],"mathematical":[94],"formulas":[95],"while":[98],"also":[99],"discussing":[100],"some":[101],"the":[103,117],"open":[104],"problems":[105],"context":[108],"how":[110],"aim":[112],"solve":[114],"them":[115],"future.":[118]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":2}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
