{"id":"https://openalex.org/W4287851300","doi":"https://doi.org/10.1109/spw54247.2022.9833885","title":"A Format-Aware Reducer for Scriptable Rewriting of PDF Files","display_name":"A Format-Aware Reducer for Scriptable Rewriting of PDF Files","publication_year":2022,"publication_date":"2022-05-01","ids":{"openalex":"https://openalex.org/W4287851300","doi":"https://doi.org/10.1109/spw54247.2022.9833885"},"language":"en","primary_location":{"id":"doi:10.1109/spw54247.2022.9833885","is_oa":false,"landing_page_url":"https://doi.org/10.1109/spw54247.2022.9833885","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE Security and Privacy Workshops (SPW)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5087984010","display_name":"Prashant Anantharaman","orcid":"https://orcid.org/0009-0005-5083-4729"},"institutions":[{"id":"https://openalex.org/I107672454","display_name":"Dartmouth College","ror":"https://ror.org/049s0rh22","country_code":"US","type":"education","lineage":["https://openalex.org/I107672454"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Prashant Anantharaman","raw_affiliation_strings":["Dartmouth College,Hanover,NH","Dartmouth College, Hanover, NH"],"affiliations":[{"raw_affiliation_string":"Dartmouth College,Hanover,NH","institution_ids":["https://openalex.org/I107672454"]},{"raw_affiliation_string":"Dartmouth College, Hanover, NH","institution_ids":["https://openalex.org/I107672454"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079175162","display_name":"Steven W. Cheung","orcid":"https://orcid.org/0000-0003-1724-4944"},"institutions":[{"id":"https://openalex.org/I1298353152","display_name":"SRI International","ror":"https://ror.org/05s570m15","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I1298353152"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Steven Cheung","raw_affiliation_strings":["SRI International,CA,USA","SRI International, CA, USA"],"affiliations":[{"raw_affiliation_string":"SRI International,CA,USA","institution_ids":["https://openalex.org/I1298353152"]},{"raw_affiliation_string":"SRI International, CA, USA","institution_ids":["https://openalex.org/I1298353152"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079132543","display_name":"Nicholas Boorman","orcid":null},"institutions":[{"id":"https://openalex.org/I1298353152","display_name":"SRI International","ror":"https://ror.org/05s570m15","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I1298353152"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Nicholas Boorman","raw_affiliation_strings":["SRI International,CA,USA","SRI International, CA, USA"],"affiliations":[{"raw_affiliation_string":"SRI International,CA,USA","institution_ids":["https://openalex.org/I1298353152"]},{"raw_affiliation_string":"SRI International, CA, USA","institution_ids":["https://openalex.org/I1298353152"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5086616243","display_name":"Michael E. Locasto","orcid":null},"institutions":[{"id":"https://openalex.org/I201654770","display_name":"PPG Industries (United States)","ror":"https://ror.org/025h3d465","country_code":"US","type":"company","lineage":["https://openalex.org/I201654770"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Michael E. Locasto","raw_affiliation_strings":["Narf Industries,NJ,USA","Narf Industries, NJ, USA"],"affiliations":[{"raw_affiliation_string":"Narf Industries,NJ,USA","institution_ids":["https://openalex.org/I201654770"]},{"raw_affiliation_string":"Narf Industries, NJ, USA","institution_ids":["https://openalex.org/I201654770"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5087984010"],"corresponding_institution_ids":["https://openalex.org/I107672454"],"apc_list":null,"apc_paid":null,"fwci":0.1488,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.38580819,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"2","issue":null,"first_page":"136","last_page":"151"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11241","display_name":"Advanced Malware Detection Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11241","display_name":"Advanced Malware Detection Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11424","display_name":"Security and Verification in Computing","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10743","display_name":"Software Testing and Debugging Techniques","score":0.9965000152587891,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.9036542177200317},{"id":"https://openalex.org/keywords/parsing","display_name":"Parsing","score":0.7962281703948975},{"id":"https://openalex.org/keywords/reducer","display_name":"Reducer","score":0.7774105072021484},{"id":"https://openalex.org/keywords/rewriting","display_name":"Rewriting","score":0.7253282070159912},{"id":"https://openalex.org/keywords/normalization","display_name":"Normalization (sociology)","score":0.6835255026817322},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.6638568639755249},{"id":"https://openalex.org/keywords/abstract-syntax-tree","display_name":"Abstract syntax tree","score":0.5525153875350952},{"id":"https://openalex.org/keywords/serialization","display_name":"Serialization","score":0.4907294511795044},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4318193197250366}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.9036542177200317},{"id":"https://openalex.org/C186644900","wikidata":"https://www.wikidata.org/wiki/Q194152","display_name":"Parsing","level":2,"score":0.7962281703948975},{"id":"https://openalex.org/C2776985865","wikidata":"https://www.wikidata.org/wiki/Q26820931","display_name":"Reducer","level":2,"score":0.7774105072021484},{"id":"https://openalex.org/C154690210","wikidata":"https://www.wikidata.org/wiki/Q1668499","display_name":"Rewriting","level":2,"score":0.7253282070159912},{"id":"https://openalex.org/C136886441","wikidata":"https://www.wikidata.org/wiki/Q926129","display_name":"Normalization (sociology)","level":2,"score":0.6835255026817322},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.6638568639755249},{"id":"https://openalex.org/C58646249","wikidata":"https://www.wikidata.org/wiki/Q127380","display_name":"Abstract syntax tree","level":3,"score":0.5525153875350952},{"id":"https://openalex.org/C52723943","wikidata":"https://www.wikidata.org/wiki/Q1127410","display_name":"Serialization","level":2,"score":0.4907294511795044},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4318193197250366},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C19165224","wikidata":"https://www.wikidata.org/wiki/Q23404","display_name":"Anthropology","level":1,"score":0.0},{"id":"https://openalex.org/C147176958","wikidata":"https://www.wikidata.org/wiki/Q77590","display_name":"Civil engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/spw54247.2022.9833885","is_oa":false,"landing_page_url":"https://doi.org/10.1109/spw54247.2022.9833885","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE Security and Privacy Workshops (SPW)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320332180","display_name":"Defense Advanced Research Projects Agency","ror":"https://ror.org/02caytj08"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W270849871","https://openalex.org/W1893177189","https://openalex.org/W1921030581","https://openalex.org/W1976327390","https://openalex.org/W2030246490","https://openalex.org/W2064452120","https://openalex.org/W2082190528","https://openalex.org/W2083773633","https://openalex.org/W2110986027","https://openalex.org/W2134633067","https://openalex.org/W2140164978","https://openalex.org/W2250653840","https://openalex.org/W2280263187","https://openalex.org/W2401293755","https://openalex.org/W2501098765","https://openalex.org/W2786078377","https://openalex.org/W3008443479","https://openalex.org/W3100284210","https://openalex.org/W3113497636","https://openalex.org/W3116973745","https://openalex.org/W3166537212","https://openalex.org/W3178680414","https://openalex.org/W4239035626","https://openalex.org/W4250353368","https://openalex.org/W6691892052","https://openalex.org/W6748019475"],"related_works":["https://openalex.org/W2077104824","https://openalex.org/W2393678839","https://openalex.org/W1972256049","https://openalex.org/W2501393023","https://openalex.org/W3180820912","https://openalex.org/W2483803551","https://openalex.org/W4285289289","https://openalex.org/W2019401739","https://openalex.org/W2145930257","https://openalex.org/W2168778844"],"abstract_inverted_index":{"Sanitizing":[0],"untrusted":[1],"input":[2,12,28,122],"is":[3,177],"a":[4,19,53,94,106,116,138],"significant":[5],"unsolved":[6],"problem":[7],"in":[8,52],"defensive":[9],"cybersecurity":[10],"and":[11,128,151,191],"handling.":[13],"Even":[14],"if":[15],"we":[16,103,136,160,203],"assume":[17],"that":[18,167],"safe,":[20],"provably":[21],"correct":[22],"parser":[23,42],"exists":[24],"to":[25,62,78,86,97,108,118,126,131,144,165,172],"validate":[26],"the":[27,35,41,49,58,76,82,91,109,148,169,188,201],"syntax,":[29],"processing":[30,59],"logic":[31,60],"may":[32],"still":[33],"require":[34],"application":[36],"of":[37,40,140],"certain":[38],"transformations":[39,120],"output.":[43],"For":[44],"example,":[45],"parsers":[46],"traditionally":[47],"store":[48],"parsed":[50],"objects":[51],"generic":[54],"tree":[55],"structure;":[56],"hence":[57],"needed":[61],"modify":[63,98],"this":[64],"structure":[65,84],"can":[66],"be":[67,145],"significant.":[68],"Also,":[69],"popular":[70,194],"parsing":[71],"tools":[72,143,180,197],"do":[73,198],"not":[74,199],"include":[75],"functionality":[77],"serialize":[79],"(or":[80],"unparse)":[81],"internal":[83],"back":[85],"bytes.This":[87],"paper":[88],"argues":[89],"for":[90,93],"need":[92],"format-aware":[95],"tool":[96,117],"structured":[99],"files.":[100,134],"In":[101],"particular,":[102],"propose":[104],"adding":[105],"reducer":[107,175],"Parsley":[110,114,141],"PDF":[111,133,195],"checker.":[112],"The":[113],"Reducer\u2014":[115],"apply":[119,200],"on":[121],"dynamically\u2014would":[123],"allow":[124],"developers":[125],"design":[127,173],"implement":[129],"rules":[130,176],"transform":[132],"Next,":[135],"describe":[137],"set":[139],"normalization":[142,163],"used":[146],"with":[147],"Reducer":[149],"API":[150],"showcase":[152],"their":[153],"capabilities":[154],"using":[155],"several":[156],"case":[157],"studies.":[158],"Finally,":[159],"evaluate":[161],"our":[162,174],"approach":[164],"demonstrate":[166],"(1)":[168],"developer":[170],"effort":[171],"minimal,":[178],"(2)":[179],"extract":[181],"more":[182],"text":[183],"from":[184],"transformed":[185],"files":[186],"than":[187],"original":[189],"files,":[190],"(3)":[192],"other":[193],"transformation":[196],"corrections":[202],"demonstrate.":[204]},"counts_by_year":[{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
