{"id":"https://openalex.org/W2963483292","doi":"https://doi.org/10.1145/3314344.3332496","title":"Examining the challenges in development data pipeline","display_name":"Examining the challenges in development data pipeline","publication_year":2019,"publication_date":"2019-07-03","ids":{"openalex":"https://openalex.org/W2963483292","doi":"https://doi.org/10.1145/3314344.3332496","mag":"2963483292"},"language":"en","primary_location":{"id":"doi:10.1145/3314344.3332496","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3314344.3332496","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2nd ACM SIGCAS Conference on Computing and Sustainable Societies","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5033048336","display_name":"Fahad Pervaiz","orcid":"https://orcid.org/0000-0003-1941-082X"},"institutions":[{"id":"https://openalex.org/I201448701","display_name":"University of Washington","ror":"https://ror.org/00cvxb145","country_code":"US","type":"education","lineage":["https://openalex.org/I201448701"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Fahad Pervaiz","raw_affiliation_strings":["University of Washington"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Washington","institution_ids":["https://openalex.org/I201448701"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072922547","display_name":"Aditya Vashistha","orcid":"https://orcid.org/0000-0001-5693-3326"},"institutions":[{"id":"https://openalex.org/I201448701","display_name":"University of Washington","ror":"https://ror.org/00cvxb145","country_code":"US","type":"education","lineage":["https://openalex.org/I201448701"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Aditya Vashistha","raw_affiliation_strings":["University of Washington"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Washington","institution_ids":["https://openalex.org/I201448701"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5076685799","display_name":"Richard Anderson","orcid":"https://orcid.org/0000-0002-7283-7219"},"institutions":[{"id":"https://openalex.org/I201448701","display_name":"University of Washington","ror":"https://ror.org/00cvxb145","country_code":"US","type":"education","lineage":["https://openalex.org/I201448701"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Richard Anderson","raw_affiliation_strings":["University of Washington"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Washington","institution_ids":["https://openalex.org/I201448701"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":4.232,"has_fulltext":false,"cited_by_count":17,"citation_normalized_percentile":{"value":0.9480327,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"13","last_page":"21"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13194","display_name":"ICT in Developing Communities","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13194","display_name":"ICT in Developing Communities","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11980","display_name":"Human Mobility and Location-Based Analysis","score":0.9810000061988831,"subfield":{"id":"https://openalex.org/subfields/3313","display_name":"Transportation"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10953","display_name":"E-Government and Public Services","score":0.9733999967575073,"subfield":{"id":"https://openalex.org/subfields/3320","display_name":"Political Science and International Relations"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6357945799827576},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.6096587181091309},{"id":"https://openalex.org/keywords/data-governance","display_name":"Data governance","score":0.5879396200180054},{"id":"https://openalex.org/keywords/data-collection","display_name":"Data collection","score":0.5353444218635559},{"id":"https://openalex.org/keywords/government","display_name":"Government (linguistics)","score":0.5283703804016113},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.5270683765411377},{"id":"https://openalex.org/keywords/open-data","display_name":"Open data","score":0.4805781841278076},{"id":"https://openalex.org/keywords/work","display_name":"Work (physics)","score":0.47574377059936523},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4749370217323303},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.4679946303367615},{"id":"https://openalex.org/keywords/knowledge-management","display_name":"Knowledge management","score":0.39715543389320374},{"id":"https://openalex.org/keywords/process-management","display_name":"Process management","score":0.3739061951637268},{"id":"https://openalex.org/keywords/data-quality","display_name":"Data quality","score":0.30774372816085815},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.28145015239715576},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.18081173300743103},{"id":"https://openalex.org/keywords/business","display_name":"Business","score":0.17492690682411194},{"id":"https://openalex.org/keywords/service","display_name":"Service (business)","score":0.11252111196517944},{"id":"https://openalex.org/keywords/marketing","display_name":"Marketing","score":0.10314053297042847}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6357945799827576},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.6096587181091309},{"id":"https://openalex.org/C196879817","wikidata":"https://www.wikidata.org/wiki/Q872685","display_name":"Data governance","level":4,"score":0.5879396200180054},{"id":"https://openalex.org/C133462117","wikidata":"https://www.wikidata.org/wiki/Q4929239","display_name":"Data collection","level":2,"score":0.5353444218635559},{"id":"https://openalex.org/C2778137410","wikidata":"https://www.wikidata.org/wiki/Q2732820","display_name":"Government (linguistics)","level":2,"score":0.5283703804016113},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.5270683765411377},{"id":"https://openalex.org/C2780535194","wikidata":"https://www.wikidata.org/wiki/Q309901","display_name":"Open data","level":2,"score":0.4805781841278076},{"id":"https://openalex.org/C18762648","wikidata":"https://www.wikidata.org/wiki/Q42213","display_name":"Work (physics)","level":2,"score":0.47574377059936523},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4749370217323303},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.4679946303367615},{"id":"https://openalex.org/C56739046","wikidata":"https://www.wikidata.org/wiki/Q192060","display_name":"Knowledge management","level":1,"score":0.39715543389320374},{"id":"https://openalex.org/C195094911","wikidata":"https://www.wikidata.org/wiki/Q14167904","display_name":"Process management","level":1,"score":0.3739061951637268},{"id":"https://openalex.org/C24756922","wikidata":"https://www.wikidata.org/wiki/Q1757694","display_name":"Data quality","level":3,"score":0.30774372816085815},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.28145015239715576},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.18081173300743103},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.17492690682411194},{"id":"https://openalex.org/C2780378061","wikidata":"https://www.wikidata.org/wiki/Q25351891","display_name":"Service (business)","level":2,"score":0.11252111196517944},{"id":"https://openalex.org/C162853370","wikidata":"https://www.wikidata.org/wiki/Q39809","display_name":"Marketing","level":1,"score":0.10314053297042847},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C78519656","wikidata":"https://www.wikidata.org/wiki/Q101333","display_name":"Mechanical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3314344.3332496","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3314344.3332496","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2nd ACM SIGCAS Conference on Computing and Sustainable Societies","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.46000000834465027,"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":41,"referenced_works":["https://openalex.org/W25706487","https://openalex.org/W185683210","https://openalex.org/W642006801","https://openalex.org/W1479965084","https://openalex.org/W1502624642","https://openalex.org/W1516293359","https://openalex.org/W1530124122","https://openalex.org/W1547612978","https://openalex.org/W1551385575","https://openalex.org/W1610496399","https://openalex.org/W1740243371","https://openalex.org/W1979290264","https://openalex.org/W2002752983","https://openalex.org/W2004634429","https://openalex.org/W2016878687","https://openalex.org/W2022592150","https://openalex.org/W2028251458","https://openalex.org/W2036309921","https://openalex.org/W2041439319","https://openalex.org/W2046797334","https://openalex.org/W2051508205","https://openalex.org/W2055049468","https://openalex.org/W2064766209","https://openalex.org/W2080731889","https://openalex.org/W2106895292","https://openalex.org/W2108991785","https://openalex.org/W2114793173","https://openalex.org/W2131576956","https://openalex.org/W2169454125","https://openalex.org/W2342249984","https://openalex.org/W2516470118","https://openalex.org/W2915412380","https://openalex.org/W3099883947","https://openalex.org/W3146259567","https://openalex.org/W4213342056","https://openalex.org/W4229650163","https://openalex.org/W4235243453","https://openalex.org/W4242428206","https://openalex.org/W4401946675","https://openalex.org/W6636177537","https://openalex.org/W6676014748"],"related_works":["https://openalex.org/W4389473037","https://openalex.org/W2899425562","https://openalex.org/W2910106972","https://openalex.org/W4386462015","https://openalex.org/W3015446482","https://openalex.org/W1580000338","https://openalex.org/W1597628794","https://openalex.org/W3204021274","https://openalex.org/W2338543293","https://openalex.org/W3185796454"],"abstract_inverted_index":{"The":[0],"developing":[1],"world":[2],"has":[3],"increasingly":[4],"relied":[5],"on":[6],"data":[7,17,41,60,67,86,116,131,142,155,175,182],"driven":[8],"policies.":[9],"Numerous":[10],"development":[11,22,85,104,130],"agencies":[12],"have":[13,28],"pushed":[14],"for":[15,33,186],"on-ground":[16],"collection":[18],"to":[19,69,95,172,177],"support":[20,70,162],"the":[21,38,74,81,121,166,169,180],"work":[23],"they":[24],"pursue.":[25],"Many":[26],"governments":[27],"launched":[29],"their":[30],"own":[31],"efforts":[32],"frequent":[34],"information":[35],"gathering.":[36],"Overall,":[37],"amount":[39],"of":[40,55,73,83,98,120,154],"collected":[42],"is":[43,171],"tremendous,":[44],"yet":[45],"there":[46],"are":[47],"significant":[48],"issues":[49],"in":[50,59,128],"doing":[51],"useful":[52],"analysis.":[53,75,187],"Most":[54],"these":[56],"barriers":[57],"manifest":[58],"cleaning":[61,84,156,183],"and":[62,64,106,115,140,158,184],"merging,":[63],"require":[65],"a":[66,151],"engineer":[68],"some":[71],"parts":[72],"In":[76],"this":[77],"paper,":[78],"we":[79,123],"investigate":[80],"challenges":[82,126],"through":[87],"an":[88],"interview":[89],"based":[90],"study.":[91],"We":[92,149],"conducted":[93],"face":[94,96],"interviews":[97,122],"13":[99],"stakeholders,":[100],"eight":[101],"from":[102,110,143],"international":[103],"organizations":[105],"five":[107],"government":[108],"workers":[109],"Pakistan,":[111],"including":[112,132],"both":[113],"managers":[114],"analysts.":[117],"From":[118],"analysis":[119],"identified":[124],"common":[125],"faced":[127],"processing":[129],"correcting":[133],"open":[134],"text":[135],"fields,":[136],"merging":[137],"hierarchical":[138],"data,":[139],"extracting":[141],"textual":[144],"formats":[145],"such":[146],"as":[147],"PDF.":[148],"construct":[150],"basic":[152],"taxonomy":[153],"challenges,":[157],"identify":[159],"areas":[160],"where":[161],"tools":[163],"can":[164],"improve":[165],"process.":[167],"Ultimately,":[168],"objective":[170],"empower":[173],"regular":[174],"users":[176],"easily":[178],"do":[179],"necessary":[181],"scrubbing":[185]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2024,"cited_by_count":4},{"year":2022,"cited_by_count":6},{"year":2021,"cited_by_count":4},{"year":2020,"cited_by_count":2}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
