{"id":"https://openalex.org/W4313150562","doi":"https://doi.org/10.1109/mahc.2022.3214736","title":"Challenges of Large-Scale Data Processing in the 1990s: The IPUMS Experience","display_name":"Challenges of Large-Scale Data Processing in the 1990s: The IPUMS Experience","publication_year":2022,"publication_date":"2022-10-01","ids":{"openalex":"https://openalex.org/W4313150562","doi":"https://doi.org/10.1109/mahc.2022.3214736","pmid":"https://pubmed.ncbi.nlm.nih.gov/37159752"},"language":"en","primary_location":{"id":"doi:10.1109/mahc.2022.3214736","is_oa":true,"landing_page_url":"https://doi.org/10.1109/mahc.2022.3214736","pdf_url":"https://ieeexplore.ieee.org/ielx7/85/9972843/09972862.pdf","source":{"id":"https://openalex.org/S118545620","display_name":"IEEE Annals of the History of Computing","issn_l":"1058-6180","issn":["1058-6180","1934-1547"],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Annals of the History of Computing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://ieeexplore.ieee.org/ielx7/85/9972843/09972862.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5010136783","display_name":"Diana L. Magnuson","orcid":"https://orcid.org/0000-0002-8729-5109"},"institutions":[{"id":"https://openalex.org/I130238516","display_name":"University of Minnesota","ror":"https://ror.org/017zqws13","country_code":"US","type":"education","lineage":["https://openalex.org/I130238516"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Diana L. Magnuson","raw_affiliation_strings":["Institute for Social Research and Data Innovation, University of Minnesota, Minneapolis, MN, USA"],"affiliations":[{"raw_affiliation_string":"Institute for Social Research and Data Innovation, University of Minnesota, Minneapolis, MN, USA","institution_ids":["https://openalex.org/I130238516"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5059262480","display_name":"Steven Ruggles","orcid":"https://orcid.org/0000-0001-5353-2578"},"institutions":[{"id":"https://openalex.org/I130238516","display_name":"University of Minnesota","ror":"https://ror.org/017zqws13","country_code":"US","type":"education","lineage":["https://openalex.org/I130238516"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Steven Ruggles","raw_affiliation_strings":["Institute for Social Research and Data Innovation, University of Minnesota, Minneapolis, MN, USA"],"affiliations":[{"raw_affiliation_string":"Institute for Social Research and Data Innovation, University of Minnesota, Minneapolis, MN, USA","institution_ids":["https://openalex.org/I130238516"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5010136783"],"corresponding_institution_ids":["https://openalex.org/I130238516"],"apc_list":null,"apc_paid":null,"fwci":0.5086,"has_fulltext":true,"cited_by_count":4,"citation_normalized_percentile":{"value":0.7000804,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":"44","issue":"4","first_page":"71","last_page":"83"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9695000052452087,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9695000052452087,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11937","display_name":"Research Data Management Practices","score":0.968500018119812,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14201","display_name":"Data Analysis and Archiving","score":0.9614999890327454,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/interoperability","display_name":"Interoperability","score":0.7488871216773987},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6410998106002808},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.6162964701652527},{"id":"https://openalex.org/keywords/documentation","display_name":"Documentation","score":0.5456902980804443},{"id":"https://openalex.org/keywords/dissemination","display_name":"Dissemination","score":0.5255956649780273},{"id":"https://openalex.org/keywords/data-processing","display_name":"Data processing","score":0.4389594793319702},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.3342326283454895},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.29440218210220337},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.20336955785751343}],"concepts":[{"id":"https://openalex.org/C20136886","wikidata":"https://www.wikidata.org/wiki/Q749647","display_name":"Interoperability","level":2,"score":0.7488871216773987},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6410998106002808},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.6162964701652527},{"id":"https://openalex.org/C56666940","wikidata":"https://www.wikidata.org/wiki/Q788790","display_name":"Documentation","level":2,"score":0.5456902980804443},{"id":"https://openalex.org/C101780184","wikidata":"https://www.wikidata.org/wiki/Q840576","display_name":"Dissemination","level":2,"score":0.5255956649780273},{"id":"https://openalex.org/C138827492","wikidata":"https://www.wikidata.org/wiki/Q6661985","display_name":"Data processing","level":2,"score":0.4389594793319702},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.3342326283454895},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.29440218210220337},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.20336955785751343},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1109/mahc.2022.3214736","is_oa":true,"landing_page_url":"https://doi.org/10.1109/mahc.2022.3214736","pdf_url":"https://ieeexplore.ieee.org/ielx7/85/9972843/09972862.pdf","source":{"id":"https://openalex.org/S118545620","display_name":"IEEE Annals of the History of Computing","issn_l":"1058-6180","issn":["1058-6180","1934-1547"],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Annals of the History of Computing","raw_type":"journal-article"},{"id":"pmid:37159752","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/37159752","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE annals of the history of computing","raw_type":null},{"id":"pmh:oai:pubmedcentral.nih.gov:10163666","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/10163666","pdf_url":"https://pmc.ncbi.nlm.nih.gov/articles/PMC10163666/pdf/nihms-1876168.pdf","source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Ann Hist Comput","raw_type":"Text"},{"id":"pmh:oai:muse.jhu.edu:/article/876944","is_oa":false,"landing_page_url":"https://muse.jhu.edu/pub/87/article/876944","pdf_url":null,"source":{"id":"https://openalex.org/S4377196299","display_name":"Project Muse (Johns Hopkins University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I145311948","host_organization_name":"Johns Hopkins University","host_organization_lineage":["https://openalex.org/I145311948"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"}],"best_oa_location":{"id":"doi:10.1109/mahc.2022.3214736","is_oa":true,"landing_page_url":"https://doi.org/10.1109/mahc.2022.3214736","pdf_url":"https://ieeexplore.ieee.org/ielx7/85/9972843/09972862.pdf","source":{"id":"https://openalex.org/S118545620","display_name":"IEEE Annals of the History of Computing","issn_l":"1058-6180","issn":["1058-6180","1934-1547"],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Annals of the History of Computing","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.6700000166893005,"display_name":"Industry, innovation and infrastructure","id":"https://metadata.un.org/sdg/9"}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4313150562.pdf","grobid_xml":"https://content.openalex.org/works/W4313150562.grobid-xml"},"referenced_works_count":23,"referenced_works":["https://openalex.org/W107887801","https://openalex.org/W1968741932","https://openalex.org/W1992119663","https://openalex.org/W2019355382","https://openalex.org/W2032855437","https://openalex.org/W2044956429","https://openalex.org/W2051470211","https://openalex.org/W2069262531","https://openalex.org/W2085946510","https://openalex.org/W2315790022","https://openalex.org/W2316354681","https://openalex.org/W2329327294","https://openalex.org/W2607866088","https://openalex.org/W2610970203","https://openalex.org/W2810329883","https://openalex.org/W2810636282","https://openalex.org/W3037271110","https://openalex.org/W3120724860","https://openalex.org/W4247380411","https://openalex.org/W4253027308","https://openalex.org/W6604267005","https://openalex.org/W6736987211","https://openalex.org/W6982712541"],"related_works":["https://openalex.org/W2093262417","https://openalex.org/W2123131699","https://openalex.org/W2618286804","https://openalex.org/W2374084962","https://openalex.org/W913131694","https://openalex.org/W2329643025","https://openalex.org/W2978405156","https://openalex.org/W650116260","https://openalex.org/W2378329187","https://openalex.org/W2965679711"],"abstract_inverted_index":{"When":[0],"it":[1],"was":[2,33,41,65],"launched":[3],"in":[4,95,157],"1991,":[5],"the":[6,73,90,96,107,126,129,151,158],"Integrated":[7],"Public":[8],"Use":[9],"Microdata":[10],"Series":[11],"(IPUMS)":[12],"project":[13],"faced":[14,76],"a":[15,114,134,147],"challenging":[16],"environment":[17,132],"and":[18,25,44,84,105,120,162],"limited":[19],"resources.":[20],"Few":[21],"datasets":[22,40],"were":[23,57],"interoperable":[24],"much":[26],"data":[27,56,81,167],"collected":[28],"at":[29],"great":[30],"public":[31],"expense":[32],"inaccessible":[34],"to":[35,52,67,100,102,124,165],"most":[36],"researchers.":[37],"Documentation":[38],"of":[39,79,116,128,136,142,146,150,153],"nonstandardized,":[42],"incomplete,":[43],"inadequate":[45,80],"for":[46],"automated":[47],"processing.":[48],"With":[49],"insufficient":[50],"attention":[51],"preservation,":[53],"valuable":[54],"scientific":[55],"disappearing":[58],"(see":[59],"Bogue":[60],"et":[61],"al.,":[62],"1976).":[63],"IPUMS":[64,75,130,143],"established":[66],"address":[68],"these":[69],"critical":[70],"issues.":[71],"At":[72],"outset,":[74],"daunting":[77],"barriers":[78],"processing,":[82],"storage,":[83],"network":[85],"capacity.":[86],"This":[87],"anecdote":[88],"describes":[89],"improvised":[91],"computational":[92],"infrastructure":[93,156],"developed":[94],"decade":[97],"from":[98],"1989":[99],"1999":[101],"process,":[103],"manage,":[104],"disseminate":[106],"world's":[108],"largest":[109],"population":[110],"datasets.":[111],"We":[112],"use":[113],"combination":[115],"archival":[117],"sources,":[118],"interviews,":[119],"our":[121],"own":[122],"memories":[123],"trace":[125],"development":[127,141,152],"computing":[131],"during":[133],"period":[135],"explosive":[137],"technical":[138],"innovation.":[139],"The":[140],"is":[144],"part":[145],"larger":[148],"story":[149],"social":[154],"science":[155],"late":[159],"20th":[160],"century":[161],"its":[163],"contribution":[164],"democratizing":[166],"access.":[168]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":1}],"updated_date":"2026-04-21T08:09:41.155169","created_date":"2025-10-10T00:00:00"}
