{"id":"https://openalex.org/W2144790020","doi":"https://doi.org/10.1109/tkde.2003.1209004","title":"Searching with numbers","display_name":"Searching with numbers","publication_year":2003,"publication_date":"2003-07-01","ids":{"openalex":"https://openalex.org/W2144790020","doi":"https://doi.org/10.1109/tkde.2003.1209004","mag":"2144790020"},"language":"en","primary_location":{"id":"doi:10.1109/tkde.2003.1209004","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tkde.2003.1209004","pdf_url":null,"source":{"id":"https://openalex.org/S30698027","display_name":"IEEE Transactions on Knowledge and Data Engineering","issn_l":"1041-4347","issn":["1041-4347","1558-2191","2326-3865"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Knowledge and Data Engineering","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103154659","display_name":"R. K. Agrawal","orcid":"https://orcid.org/0000-0003-3122-5096"},"institutions":[{"id":"https://openalex.org/I4210085935","display_name":"IBM Research - Almaden","ror":"https://ror.org/005w8dd04","country_code":"US","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210085935","https://openalex.org/I4210114115"]},{"id":"https://openalex.org/I1341412227","display_name":"IBM (United States)","ror":"https://ror.org/05hh8d621","country_code":"US","type":"company","lineage":["https://openalex.org/I1341412227"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"R. Agrawal","raw_affiliation_strings":["IBM Almaden Research Center, San Jose, CA, USA","IBM Almaden Research Center, San Jose, CA USA"],"affiliations":[{"raw_affiliation_string":"IBM Almaden Research Center, San Jose, CA, USA","institution_ids":["https://openalex.org/I4210085935"]},{"raw_affiliation_string":"IBM Almaden Research Center, San Jose, CA USA","institution_ids":["https://openalex.org/I1341412227"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5042887703","display_name":"Ramakrishnan Srikant","orcid":null},"institutions":[{"id":"https://openalex.org/I1341412227","display_name":"IBM (United States)","ror":"https://ror.org/05hh8d621","country_code":"US","type":"company","lineage":["https://openalex.org/I1341412227"]},{"id":"https://openalex.org/I4210085935","display_name":"IBM Research - Almaden","ror":"https://ror.org/005w8dd04","country_code":"US","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210085935","https://openalex.org/I4210114115"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"R. Srikant","raw_affiliation_strings":["IBM Almaden Research Center, San Jose, CA, USA","IBM Almaden Research Center, San Jose, CA USA"],"affiliations":[{"raw_affiliation_string":"IBM Almaden Research Center, San Jose, CA, USA","institution_ids":["https://openalex.org/I4210085935"]},{"raw_affiliation_string":"IBM Almaden Research Center, San Jose, CA USA","institution_ids":["https://openalex.org/I1341412227"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5103154659"],"corresponding_institution_ids":["https://openalex.org/I1341412227","https://openalex.org/I4210085935"],"apc_list":null,"apc_paid":null,"fwci":0.2928,"has_fulltext":false,"cited_by_count":16,"citation_normalized_percentile":{"value":0.59591014,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":"15","issue":"4","first_page":"855","last_page":"870"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8702315092086792},{"id":"https://openalex.org/keywords/search-engine-indexing","display_name":"Search engine indexing","score":0.7285812497138977},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.6807793378829956},{"id":"https://openalex.org/keywords/variety","display_name":"Variety (cybernetics)","score":0.5051911473274231},{"id":"https://openalex.org/keywords/information-extraction","display_name":"Information extraction","score":0.46687954664230347},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.46598783135414124},{"id":"https://openalex.org/keywords/fraction","display_name":"Fraction (chemistry)","score":0.4610303044319153},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.24458426237106323}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8702315092086792},{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.7285812497138977},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.6807793378829956},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.5051911473274231},{"id":"https://openalex.org/C195807954","wikidata":"https://www.wikidata.org/wiki/Q1662562","display_name":"Information extraction","level":2,"score":0.46687954664230347},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.46598783135414124},{"id":"https://openalex.org/C149629883","wikidata":"https://www.wikidata.org/wiki/Q660926","display_name":"Fraction (chemistry)","level":2,"score":0.4610303044319153},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.24458426237106323},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tkde.2003.1209004","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tkde.2003.1209004","pdf_url":null,"source":{"id":"https://openalex.org/S30698027","display_name":"IEEE Transactions on Knowledge and Data Engineering","issn_l":"1041-4347","issn":["1041-4347","1558-2191","2326-3865"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Knowledge and Data Engineering","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W1833785989","https://openalex.org/W1972978715","https://openalex.org/W2005649826","https://openalex.org/W2007278710","https://openalex.org/W2015914309","https://openalex.org/W2018177083","https://openalex.org/W2036705516","https://openalex.org/W2039995466","https://openalex.org/W2046144220","https://openalex.org/W2051834357","https://openalex.org/W2086174602","https://openalex.org/W2132082507","https://openalex.org/W2134206624","https://openalex.org/W2141649964","https://openalex.org/W2147152072","https://openalex.org/W2147717514","https://openalex.org/W2153752143","https://openalex.org/W2161694911","https://openalex.org/W2168160104","https://openalex.org/W2666600683","https://openalex.org/W3003338753","https://openalex.org/W3164674465","https://openalex.org/W6680863237","https://openalex.org/W6682468365"],"related_works":["https://openalex.org/W3024364549","https://openalex.org/W4206019083","https://openalex.org/W2048865712","https://openalex.org/W1976265003","https://openalex.org/W2370378377","https://openalex.org/W2032233321","https://openalex.org/W3121970507","https://openalex.org/W4237510188","https://openalex.org/W2110028391","https://openalex.org/W2130160813"],"abstract_inverted_index":{"A":[0],"large":[1],"fraction":[2],"of":[3,9,15,56,59,175],"the":[4,36,57,82,94,97,106,113,123],"useful":[5],"Web":[6],"is":[7],"comprised":[8],"specification":[10],"documents":[11,41],"that":[12,71,160],"largely":[13],"consist":[14],"(attribute":[16],"name,":[17],"numeric":[18],"value)":[19],"pairs":[20],"embedded":[21],"in":[22,35,96,112,165],"text.":[23,65],"Examples":[24],"include":[25],"product":[26],"information,":[27],"classified":[28],"advertisements,":[29],"resumes,":[30],"etc.":[31],"The":[32],"approach":[33,70,144,157],"taken":[34],"past":[37],"to":[38,77],"search":[39,91],"these":[40],"by":[42,158],"first":[43],"establishing":[44],"correspondences":[45],"between":[46],"values":[47,95],"and":[48,105,118],"their":[49],"names":[50,104,111],"has":[51,84,108],"achieved":[52],"limited":[53],"success":[54],"because":[55],"difficulty":[58],"extracting":[60],"this":[61,75],"information":[62],"from":[63,134,172],"free":[64],"We":[66,115,125],"propose":[67],"a":[68,173],"new":[69],"does":[72],"not":[73,100],"require":[74],"correspondence":[76],"be":[78,140],"accurately":[79],"established.":[80],"Provided":[81],"data":[83,98,136,151,170],"\"low":[85],"reflectivity\",":[86],"we":[87,154,161],"can":[88,139],"do":[89],"effective":[90],"even":[92],"if":[93],"have":[99],"been":[101],"assigned":[102],"attribute":[103,110],"user":[107],"omitted":[109],"query.":[114],"give":[116],"algorithms":[117],"indexing":[119],"structures":[120],"for":[121,145],"implementing":[122],"search.":[124],"also":[126],"show":[127],"how":[128],"hints":[129],"(i.e.,":[130],"imprecise,":[131],"partial":[132],"correspondences)":[133],"automatic":[135],"extraction":[137],"techniques":[138],"incorporated":[141],"into":[142],"our":[143,156,166],"better":[146],"accuracy":[147],"on":[148,168],"high":[149,163],"reflectivity":[150],"sets.":[152],"Finally,":[153],"validate":[155],"showing":[159],"get":[162],"precision":[164],"answers":[167],"real":[169],"sets":[171],"variety":[174],"domains.":[176]},"counts_by_year":[{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":2},{"year":2015,"cited_by_count":2},{"year":2014,"cited_by_count":2},{"year":2012,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
