{"id":"https://openalex.org/W2147934301","doi":"https://doi.org/10.1145/1099554.1099682","title":"Automated cleansing for spend analytics","display_name":"Automated cleansing for spend analytics","publication_year":2005,"publication_date":"2005-10-31","ids":{"openalex":"https://openalex.org/W2147934301","doi":"https://doi.org/10.1145/1099554.1099682","mag":"2147934301"},"language":"en","primary_location":{"id":"doi:10.1145/1099554.1099682","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1099554.1099682","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 14th ACM international conference on Information and knowledge management","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5110922516","display_name":"Moninder Singh","orcid":null},"institutions":[{"id":"https://openalex.org/I4210114115","display_name":"IBM Research - Thomas J. Watson Research Center","ror":"https://ror.org/0265w5591","country_code":"US","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210114115"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Moninder Singh","raw_affiliation_strings":["IBM Thomas J. Watson Research Center, Yorktown Heights, NY"],"affiliations":[{"raw_affiliation_string":"IBM Thomas J. Watson Research Center, Yorktown Heights, NY","institution_ids":["https://openalex.org/I4210114115"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057936833","display_name":"Jayant Kalagnanam","orcid":"https://orcid.org/0009-0009-5051-2606"},"institutions":[{"id":"https://openalex.org/I4210114115","display_name":"IBM Research - Thomas J. Watson Research Center","ror":"https://ror.org/0265w5591","country_code":"US","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210114115"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jayant R. Kalagnanam","raw_affiliation_strings":["IBM Thomas J. Watson Research Center, Yorktown Heights, NY"],"affiliations":[{"raw_affiliation_string":"IBM Thomas J. Watson Research Center, Yorktown Heights, NY","institution_ids":["https://openalex.org/I4210114115"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087328826","display_name":"Sudhir Verma","orcid":null},"institutions":[{"id":"https://openalex.org/I4210114115","display_name":"IBM Research - Thomas J. Watson Research Center","ror":"https://ror.org/0265w5591","country_code":"US","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210114115"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sudhir Verma","raw_affiliation_strings":["IBM Thomas J. Watson Research Center, Yorktown Heights, NY"],"affiliations":[{"raw_affiliation_string":"IBM Thomas J. Watson Research Center, Yorktown Heights, NY","institution_ids":["https://openalex.org/I4210114115"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110252219","display_name":"Amit Shah","orcid":null},"institutions":[{"id":"https://openalex.org/I4210114115","display_name":"IBM Research - Thomas J. Watson Research Center","ror":"https://ror.org/0265w5591","country_code":"US","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210114115"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Amit J. Shah","raw_affiliation_strings":["IBM Thomas J. Watson Research Center, Yorktown Heights, NY"],"affiliations":[{"raw_affiliation_string":"IBM Thomas J. Watson Research Center, Yorktown Heights, NY","institution_ids":["https://openalex.org/I4210114115"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5023867820","display_name":"Swaroop K. Chalasani","orcid":null},"institutions":[{"id":"https://openalex.org/I4210114115","display_name":"IBM Research - Thomas J. Watson Research Center","ror":"https://ror.org/0265w5591","country_code":"US","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210114115"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Swaroop K. Chalasani","raw_affiliation_strings":["IBM Thomas J. Watson Research Center, Yorktown Heights, NY"],"affiliations":[{"raw_affiliation_string":"IBM Thomas J. Watson Research Center, Yorktown Heights, NY","institution_ids":["https://openalex.org/I4210114115"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5110922516"],"corresponding_institution_ids":["https://openalex.org/I4210114115"],"apc_list":null,"apc_paid":null,"fwci":0.435,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.70772203,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"437","last_page":"445"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9970999956130981,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9970999956130981,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11912","display_name":"Outsourcing and Supply Chain Management","score":0.9909999966621399,"subfield":{"id":"https://openalex.org/subfields/1404","display_name":"Management Information Systems"},"field":{"id":"https://openalex.org/fields/14","display_name":"Business, Management and Accounting"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10679","display_name":"Service-Oriented Architecture and Web Services","score":0.9803000092506409,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/database-transaction","display_name":"Database transaction","score":0.6834397315979004},{"id":"https://openalex.org/keywords/procurement","display_name":"Procurement","score":0.6597117781639099},{"id":"https://openalex.org/keywords/transaction-data","display_name":"Transaction data","score":0.6021122932434082},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5970947742462158},{"id":"https://openalex.org/keywords/purchase-order","display_name":"Purchase order","score":0.5776547193527222},{"id":"https://openalex.org/keywords/analytics","display_name":"Analytics","score":0.5594639778137207},{"id":"https://openalex.org/keywords/online-analytical-processing","display_name":"Online analytical processing","score":0.5481685400009155},{"id":"https://openalex.org/keywords/outsourcing","display_name":"Outsourcing","score":0.5208947658538818},{"id":"https://openalex.org/keywords/order","display_name":"Order (exchange)","score":0.465678870677948},{"id":"https://openalex.org/keywords/popularity","display_name":"Popularity","score":0.4263855218887329},{"id":"https://openalex.org/keywords/business-intelligence","display_name":"Business intelligence","score":0.41843557357788086},{"id":"https://openalex.org/keywords/transactional-leadership","display_name":"Transactional leadership","score":0.41636160016059875},{"id":"https://openalex.org/keywords/commodity","display_name":"Commodity","score":0.4105663299560547},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.40331876277923584},{"id":"https://openalex.org/keywords/business","display_name":"Business","score":0.4028928577899933},{"id":"https://openalex.org/keywords/knowledge-management","display_name":"Knowledge management","score":0.33358293771743774},{"id":"https://openalex.org/keywords/purchasing","display_name":"Purchasing","score":0.2895094156265259},{"id":"https://openalex.org/keywords/data-warehouse","display_name":"Data warehouse","score":0.28595754504203796},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.2833865284919739},{"id":"https://openalex.org/keywords/marketing","display_name":"Marketing","score":0.2047327756881714},{"id":"https://openalex.org/keywords/finance","display_name":"Finance","score":0.13144081830978394}],"concepts":[{"id":"https://openalex.org/C75949130","wikidata":"https://www.wikidata.org/wiki/Q848010","display_name":"Database transaction","level":2,"score":0.6834397315979004},{"id":"https://openalex.org/C201650216","wikidata":"https://www.wikidata.org/wiki/Q829492","display_name":"Procurement","level":2,"score":0.6597117781639099},{"id":"https://openalex.org/C127722929","wikidata":"https://www.wikidata.org/wiki/Q7833714","display_name":"Transaction data","level":3,"score":0.6021122932434082},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5970947742462158},{"id":"https://openalex.org/C134418285","wikidata":"https://www.wikidata.org/wiki/Q643327","display_name":"Purchase order","level":3,"score":0.5776547193527222},{"id":"https://openalex.org/C79158427","wikidata":"https://www.wikidata.org/wiki/Q485396","display_name":"Analytics","level":2,"score":0.5594639778137207},{"id":"https://openalex.org/C201932085","wikidata":"https://www.wikidata.org/wiki/Q642514","display_name":"Online analytical processing","level":3,"score":0.5481685400009155},{"id":"https://openalex.org/C46934059","wikidata":"https://www.wikidata.org/wiki/Q61515","display_name":"Outsourcing","level":2,"score":0.5208947658538818},{"id":"https://openalex.org/C182306322","wikidata":"https://www.wikidata.org/wiki/Q1779371","display_name":"Order (exchange)","level":2,"score":0.465678870677948},{"id":"https://openalex.org/C2780586970","wikidata":"https://www.wikidata.org/wiki/Q1357284","display_name":"Popularity","level":2,"score":0.4263855218887329},{"id":"https://openalex.org/C2767350","wikidata":"https://www.wikidata.org/wiki/Q6662173","display_name":"Business intelligence","level":2,"score":0.41843557357788086},{"id":"https://openalex.org/C68489960","wikidata":"https://www.wikidata.org/wiki/Q2370659","display_name":"Transactional leadership","level":2,"score":0.41636160016059875},{"id":"https://openalex.org/C2779439359","wikidata":"https://www.wikidata.org/wiki/Q317088","display_name":"Commodity","level":2,"score":0.4105663299560547},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.40331876277923584},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.4028928577899933},{"id":"https://openalex.org/C56739046","wikidata":"https://www.wikidata.org/wiki/Q192060","display_name":"Knowledge management","level":1,"score":0.33358293771743774},{"id":"https://openalex.org/C2778813691","wikidata":"https://www.wikidata.org/wiki/Q1369832","display_name":"Purchasing","level":2,"score":0.2895094156265259},{"id":"https://openalex.org/C135572916","wikidata":"https://www.wikidata.org/wiki/Q193351","display_name":"Data warehouse","level":2,"score":0.28595754504203796},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.2833865284919739},{"id":"https://openalex.org/C162853370","wikidata":"https://www.wikidata.org/wiki/Q39809","display_name":"Marketing","level":1,"score":0.2047327756881714},{"id":"https://openalex.org/C10138342","wikidata":"https://www.wikidata.org/wiki/Q43015","display_name":"Finance","level":1,"score":0.13144081830978394},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.0},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/1099554.1099682","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1099554.1099682","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 14th ACM international conference on Information and knowledge management","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","id":"https://metadata.un.org/sdg/9","score":0.6100000143051147}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":12,"referenced_works":["https://openalex.org/W202303397","https://openalex.org/W1550206324","https://openalex.org/W1602152045","https://openalex.org/W1647671624","https://openalex.org/W1660390307","https://openalex.org/W1978394996","https://openalex.org/W2001496424","https://openalex.org/W2036216970","https://openalex.org/W2099942883","https://openalex.org/W2123402141","https://openalex.org/W2149684865","https://openalex.org/W2998380892"],"related_works":["https://openalex.org/W871714347","https://openalex.org/W1202170028","https://openalex.org/W208715492","https://openalex.org/W2186969963","https://openalex.org/W2994505632","https://openalex.org/W2586269375","https://openalex.org/W2072434258","https://openalex.org/W3082564695","https://openalex.org/W23190051","https://openalex.org/W4229708142"],"abstract_inverted_index":{"The":[0,57],"development":[1],"of":[2,6,35,64,75,102,119,124,130,183,240,289,298,307],"an":[3,11,99,121,191,252,295],"aggregate":[4],"view":[5,101,123,194,297],"the":[7,37,62,72,117,128,147,166,173,187,207,216,229,238,246,305],"procurement":[8,111,125],"spend":[9,103,126,193],"across":[10,104,140],"enterprise":[12,38],"using":[13,261],"transactional":[14,152,291],"data":[15,133,138,153,199,248,292],"is":[16,39,68,224,302],"increasingly":[17],"becoming":[18],"a":[19,30,131,282],"very":[20],"important":[21],"and":[22,32,41,112,143,179,210,266,273,286,293],"strategic":[23],"activity.":[24],"Not":[25],"only":[26],"does":[27],"it":[28,44,47,232],"provide":[29],"complete":[31],"accurate":[33,285],"picture":[34],"what":[36],"buying":[40],"from":[42,135,154,263],"whom,":[43],"also":[45],"allows":[46],"to":[48,91,97,109,172,201,205,215,234,255],"consolidate":[49],"suppliers,":[50],"as":[51,53,59,61,88,158],"well":[52,60],"negotiate":[54],"better":[55],"prices.":[56],"importance,":[58],"complexity,":[63],"this":[65,198,258,277],"cleansing":[66,259,290],"exercise":[67],"further":[69],"magnified":[70],"by":[71,176,228,310],"increasing":[73],"popularity":[74],"Business":[76],"Transformation":[77],"Outsourcing":[78],"(BTO)":[79],"wherein":[80],"enterprises":[81,106,280],"are":[82,168],"turning":[83],"over":[84],"non-core":[85],"activities,":[86],"such":[87,120,157],"indirect":[89],"procurement,":[90],"third":[92],"parties,":[93],"who":[94],"now":[95],"need":[96],"develop":[98],"integrated":[100,122,296],"multiple":[105],"in":[107,222,245,304,314],"order":[108],"optimize":[110],"generate":[113],"maximum":[114],"savings.":[115],"However,":[116],"creation":[118,129],"requires":[127],"homogeneous":[132],"repository":[134],"disparate":[136],"(heterogeneous)":[137],"sources":[139,156],"various":[141,155,247],"geographic":[142],"functional":[144],"organizations":[145],"throughout":[146],"enterprise(s).":[148],"Such":[149],"repositories":[150],"get":[151],"invoices,":[159],"purchase":[160],"orders,":[161],"account":[162],"ledgers.":[163],"As":[164],"such,":[165],"transactions":[167],"not":[169],"cross-indexed,":[170],"refer":[171],"same":[174,188],"suppliers":[175],"different":[177,181],"names,":[178],"use":[180,313],"ways":[182],"representing":[184],"information":[185,264],"about":[186],"commodities.":[189],"Before":[190],"aggregated":[192],"can":[195],"be":[196,202,235],"developed,":[197],"needs":[200],"cleansed,":[203],"primarily":[204],"normalize":[206],"supplier":[208],"names":[209],"correctly":[211],"map":[212],"each":[213],"transaction":[214],"appropriate":[217],"commodity":[218],"code.":[219],"Commodity":[220],"mapping,":[221],"particular,":[223],"made":[225],"more":[226],"difficult":[227],"fact":[230],"that":[231],"has":[233],"done":[236],"on":[237,270],"basis":[239],"unstructured":[241],"text":[242],"descriptions":[243],"found":[244],"sources.":[249],"We":[250],"describe":[251],"on-demand":[253,287],"system":[254,278,301],"automatically":[256],"perform":[257],"activity":[260],"techniques":[262],"retrieval":[265],"machine":[267],"learning.":[268],"Built":[269],"standard":[271],"integration":[272],"application":[274],"infrastructure":[275],"software,":[276],"provides":[279],"with":[281],"fast,":[283],"reliable,":[284],"way":[288],"generating":[294],"spend.":[299],"This":[300],"currently":[303],"process":[306],"being":[308],"deployed":[309],"IBM":[311],"for":[312],"its":[315],"BTO":[316],"practice.":[317]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2015,"cited_by_count":1},{"year":2013,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
