{"id":"https://openalex.org/W2011508511","doi":"https://doi.org/10.1016/s0169-7552(98)00109-3","title":"The origin of (document) species","display_name":"The origin of (document) species","publication_year":1998,"publication_date":"1998-04-01","ids":{"openalex":"https://openalex.org/W2011508511","doi":"https://doi.org/10.1016/s0169-7552(98)00109-3","mag":"2011508511"},"language":"en","primary_location":{"id":"doi:10.1016/s0169-7552(98)00109-3","is_oa":false,"landing_page_url":"https://doi.org/10.1016/s0169-7552(98)00109-3","pdf_url":null,"source":{"id":"https://openalex.org/S3084184","display_name":"Computer Networks and ISDN Systems","issn_l":"0169-7552","issn":["0169-7552","1879-2324"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computer Networks and ISDN Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113655761","display_name":"Rohit Khare","orcid":null},"institutions":[{"id":"https://openalex.org/I204250578","display_name":"University of California, Irvine","ror":"https://ror.org/04gyf1771","country_code":"US","type":"education","lineage":["https://openalex.org/I204250578"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Rohit Khare","raw_affiliation_strings":["University of California at Irvine, Department of Computer Science, Irvine, CA 92697-3425, USA"],"affiliations":[{"raw_affiliation_string":"University of California at Irvine, Department of Computer Science, Irvine, CA 92697-3425, USA","institution_ids":["https://openalex.org/I204250578"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5085823210","display_name":"Adam Rifkin","orcid":null},"institutions":[{"id":"https://openalex.org/I122411786","display_name":"California Institute of Technology","ror":"https://ror.org/05dxps055","country_code":"US","type":"education","lineage":["https://openalex.org/I122411786"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Adam Rifkin","raw_affiliation_strings":["California Institute of Technology, Computer Science Department, Pasadena, CA 91125, USA"],"affiliations":[{"raw_affiliation_string":"California Institute of Technology, Computer Science Department, Pasadena, CA 91125, USA","institution_ids":["https://openalex.org/I122411786"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5113655761"],"corresponding_institution_ids":["https://openalex.org/I204250578"],"apc_list":null,"apc_paid":null,"fwci":2.4388,"has_fulltext":false,"cited_by_count":14,"citation_normalized_percentile":{"value":0.91988387,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"30","issue":"1-7","first_page":"389","last_page":"397"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9861999750137329,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9850000143051147,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8798545598983765},{"id":"https://openalex.org/keywords/ruleml","display_name":"RuleML","score":0.6526475548744202},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.6231766939163208},{"id":"https://openalex.org/keywords/markup-language","display_name":"Markup language","score":0.5929451584815979},{"id":"https://openalex.org/keywords/html","display_name":"HTML","score":0.5486652255058289},{"id":"https://openalex.org/keywords/sgml","display_name":"SGML","score":0.48477786779403687},{"id":"https://openalex.org/keywords/web-standards","display_name":"Web standards","score":0.43785354495048523},{"id":"https://openalex.org/keywords/style-sheet","display_name":"Style sheet","score":0.4288044273853302},{"id":"https://openalex.org/keywords/semantic-web","display_name":"Semantic Web","score":0.420485258102417},{"id":"https://openalex.org/keywords/xml","display_name":"XML","score":0.4151875972747803},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.37780988216400146},{"id":"https://openalex.org/keywords/document-structure-description","display_name":"Document Structure Description","score":0.3732505142688751},{"id":"https://openalex.org/keywords/xhtml","display_name":"XHTML","score":0.3467467129230499},{"id":"https://openalex.org/keywords/web-service","display_name":"Web service","score":0.26314204931259155},{"id":"https://openalex.org/keywords/web-page","display_name":"Web page","score":0.25325489044189453}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8798545598983765},{"id":"https://openalex.org/C196388810","wikidata":"https://www.wikidata.org/wiki/Q631877","display_name":"RuleML","level":5,"score":0.6526475548744202},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.6231766939163208},{"id":"https://openalex.org/C45874996","wikidata":"https://www.wikidata.org/wiki/Q37045","display_name":"Markup language","level":3,"score":0.5929451584815979},{"id":"https://openalex.org/C138708601","wikidata":"https://www.wikidata.org/wiki/Q8811","display_name":"HTML","level":3,"score":0.5486652255058289},{"id":"https://openalex.org/C62701983","wikidata":"https://www.wikidata.org/wiki/Q207819","display_name":"SGML","level":4,"score":0.48477786779403687},{"id":"https://openalex.org/C182321512","wikidata":"https://www.wikidata.org/wiki/Q1153289","display_name":"Web standards","level":3,"score":0.43785354495048523},{"id":"https://openalex.org/C89159866","wikidata":"https://www.wikidata.org/wiki/Q4119753","display_name":"Style sheet","level":3,"score":0.4288044273853302},{"id":"https://openalex.org/C2129575","wikidata":"https://www.wikidata.org/wiki/Q54837","display_name":"Semantic Web","level":2,"score":0.420485258102417},{"id":"https://openalex.org/C8797682","wikidata":"https://www.wikidata.org/wiki/Q2115","display_name":"XML","level":2,"score":0.4151875972747803},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.37780988216400146},{"id":"https://openalex.org/C68699486","wikidata":"https://www.wikidata.org/wiki/Q265904","display_name":"Document Structure Description","level":3,"score":0.3732505142688751},{"id":"https://openalex.org/C189139006","wikidata":"https://www.wikidata.org/wiki/Q166074","display_name":"XHTML","level":4,"score":0.3467467129230499},{"id":"https://openalex.org/C35578498","wikidata":"https://www.wikidata.org/wiki/Q193424","display_name":"Web service","level":2,"score":0.26314204931259155},{"id":"https://openalex.org/C21959979","wikidata":"https://www.wikidata.org/wiki/Q36774","display_name":"Web page","level":2,"score":0.25325489044189453}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1016/s0169-7552(98)00109-3","is_oa":false,"landing_page_url":"https://doi.org/10.1016/s0169-7552(98)00109-3","pdf_url":null,"source":{"id":"https://openalex.org/S3084184","display_name":"Computer Networks and ISDN Systems","issn_l":"0169-7552","issn":["0169-7552","1879-2324"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computer Networks and ISDN Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320332467","display_name":"U.S. Air Force","ror":"https://ror.org/006gmme17"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":14,"referenced_works":["https://openalex.org/W198844848","https://openalex.org/W203724739","https://openalex.org/W1544205754","https://openalex.org/W1606487221","https://openalex.org/W2011387993","https://openalex.org/W2024660412","https://openalex.org/W2057917144","https://openalex.org/W2091167778","https://openalex.org/W2171908848","https://openalex.org/W2475481088","https://openalex.org/W6608050761","https://openalex.org/W6608320290","https://openalex.org/W6665027051","https://openalex.org/W6685399247"],"related_works":["https://openalex.org/W2580812415","https://openalex.org/W2775767401","https://openalex.org/W2625590187","https://openalex.org/W2774879466","https://openalex.org/W361548100","https://openalex.org/W2010819939","https://openalex.org/W4242799722","https://openalex.org/W1518743274","https://openalex.org/W1974368957","https://openalex.org/W2465587010"],"abstract_inverted_index":null,"counts_by_year":[{"year":2021,"cited_by_count":1},{"year":2018,"cited_by_count":1},{"year":2013,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
