{"id":"https://openalex.org/W2073759582","doi":"https://doi.org/10.1145/1089815.1089820","title":"Distributed higher order association rule mining using information extracted from textual data","display_name":"Distributed higher order association rule mining using information extracted from textual data","publication_year":2005,"publication_date":"2005-06-01","ids":{"openalex":"https://openalex.org/W2073759582","doi":"https://doi.org/10.1145/1089815.1089820","mag":"2073759582"},"language":"en","primary_location":{"id":"doi:10.1145/1089815.1089820","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1089815.1089820","pdf_url":null,"source":{"id":"https://openalex.org/S4210176598","display_name":"ACM SIGKDD Explorations Newsletter","issn_l":"1931-0145","issn":["1931-0145","1931-0153"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM SIGKDD Explorations Newsletter","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5087997370","display_name":"Shenzhi Li","orcid":null},"institutions":[{"id":"https://openalex.org/I186143895","display_name":"Lehigh University","ror":"https://ror.org/012afjb06","country_code":"US","type":"education","lineage":["https://openalex.org/I186143895"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Shenzhi Li","raw_affiliation_strings":["Lehigh University, Bethlehem, PA"],"affiliations":[{"raw_affiliation_string":"Lehigh University, Bethlehem, PA","institution_ids":["https://openalex.org/I186143895"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083841001","display_name":"Tianhao Wu","orcid":"https://orcid.org/0000-0001-7465-1242"},"institutions":[{"id":"https://openalex.org/I186143895","display_name":"Lehigh University","ror":"https://ror.org/012afjb06","country_code":"US","type":"education","lineage":["https://openalex.org/I186143895"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Tianhao Wu","raw_affiliation_strings":["Lehigh University, Bethlehem, PA"],"affiliations":[{"raw_affiliation_string":"Lehigh University, Bethlehem, PA","institution_ids":["https://openalex.org/I186143895"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5011634099","display_name":"William M. Pottenger","orcid":null},"institutions":[{"id":"https://openalex.org/I186143895","display_name":"Lehigh University","ror":"https://ror.org/012afjb06","country_code":"US","type":"education","lineage":["https://openalex.org/I186143895"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"William M. Pottenger","raw_affiliation_strings":["Lehigh University, Bethlehem, PA"],"affiliations":[{"raw_affiliation_string":"Lehigh University, Bethlehem, PA","institution_ids":["https://openalex.org/I186143895"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5087997370"],"corresponding_institution_ids":["https://openalex.org/I186143895"],"apc_list":null,"apc_paid":null,"fwci":5.9363,"has_fulltext":false,"cited_by_count":28,"citation_normalized_percentile":{"value":0.95843685,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"7","issue":"1","first_page":"26","last_page":"35"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10538","display_name":"Data Mining Algorithms and Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10538","display_name":"Data Mining Algorithms and Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11063","display_name":"Rough Sets and Fuzzy Logic","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9912999868392944,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8472983837127686},{"id":"https://openalex.org/keywords/association-rule-learning","display_name":"Association rule learning","score":0.8063012361526489},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.6445170640945435},{"id":"https://openalex.org/keywords/distributed-database","display_name":"Distributed database","score":0.6291359663009644},{"id":"https://openalex.org/keywords/schema","display_name":"Schema (genetic algorithms)","score":0.5950233936309814},{"id":"https://openalex.org/keywords/information-extraction","display_name":"Information extraction","score":0.5585007667541504},{"id":"https://openalex.org/keywords/distributed-computing-environment","display_name":"Distributed Computing Environment","score":0.5095937252044678},{"id":"https://openalex.org/keywords/distributed-algorithm","display_name":"Distributed algorithm","score":0.4918351173400879},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.48720163106918335},{"id":"https://openalex.org/keywords/knowledge-extraction","display_name":"Knowledge extraction","score":0.4480736553668976},{"id":"https://openalex.org/keywords/concept-mining","display_name":"Concept mining","score":0.41782882809638977},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.34081846475601196},{"id":"https://openalex.org/keywords/web-mining","display_name":"Web mining","score":0.28936445713043213},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.16859170794487},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.11366552114486694},{"id":"https://openalex.org/keywords/web-service","display_name":"Web service","score":0.10615432262420654}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8472983837127686},{"id":"https://openalex.org/C193524817","wikidata":"https://www.wikidata.org/wiki/Q386780","display_name":"Association rule learning","level":2,"score":0.8063012361526489},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.6445170640945435},{"id":"https://openalex.org/C70061542","wikidata":"https://www.wikidata.org/wiki/Q989016","display_name":"Distributed database","level":2,"score":0.6291359663009644},{"id":"https://openalex.org/C52146309","wikidata":"https://www.wikidata.org/wiki/Q7431116","display_name":"Schema (genetic algorithms)","level":2,"score":0.5950233936309814},{"id":"https://openalex.org/C195807954","wikidata":"https://www.wikidata.org/wiki/Q1662562","display_name":"Information extraction","level":2,"score":0.5585007667541504},{"id":"https://openalex.org/C3739613","wikidata":"https://www.wikidata.org/wiki/Q679003","display_name":"Distributed Computing Environment","level":2,"score":0.5095937252044678},{"id":"https://openalex.org/C130120984","wikidata":"https://www.wikidata.org/wiki/Q2835898","display_name":"Distributed algorithm","level":2,"score":0.4918351173400879},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.48720163106918335},{"id":"https://openalex.org/C120567893","wikidata":"https://www.wikidata.org/wiki/Q1582085","display_name":"Knowledge extraction","level":2,"score":0.4480736553668976},{"id":"https://openalex.org/C176775163","wikidata":"https://www.wikidata.org/wiki/Q5158396","display_name":"Concept mining","level":4,"score":0.41782882809638977},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.34081846475601196},{"id":"https://openalex.org/C197046077","wikidata":"https://www.wikidata.org/wiki/Q785337","display_name":"Web mining","level":3,"score":0.28936445713043213},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.16859170794487},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.11366552114486694},{"id":"https://openalex.org/C35578498","wikidata":"https://www.wikidata.org/wiki/Q193424","display_name":"Web service","level":2,"score":0.10615432262420654}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/1089815.1089820","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1089815.1089820","pdf_url":null,"source":{"id":"https://openalex.org/S4210176598","display_name":"ACM SIGKDD Explorations Newsletter","issn_l":"1931-0145","issn":["1931-0145","1931-0153"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM SIGKDD Explorations Newsletter","raw_type":"journal-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.77.8257","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.77.8257","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.dimacs.rutgers.edu/~billp/pubs/SIGKDDExplorations.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.800000011920929,"id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":23,"referenced_works":["https://openalex.org/W99053925","https://openalex.org/W395877202","https://openalex.org/W1526785773","https://openalex.org/W1553696291","https://openalex.org/W1577783107","https://openalex.org/W1906561224","https://openalex.org/W1964433626","https://openalex.org/W2004748427","https://openalex.org/W2008896880","https://openalex.org/W2068541969","https://openalex.org/W2078937669","https://openalex.org/W2083838623","https://openalex.org/W2093367651","https://openalex.org/W2093456341","https://openalex.org/W2102766632","https://openalex.org/W2110783067","https://openalex.org/W2112163170","https://openalex.org/W2119409601","https://openalex.org/W2128051069","https://openalex.org/W2137833366","https://openalex.org/W2166559705","https://openalex.org/W2966207845","https://openalex.org/W4212848460"],"related_works":["https://openalex.org/W3009866696","https://openalex.org/W127900883","https://openalex.org/W997248972","https://openalex.org/W2023322671","https://openalex.org/W17303578","https://openalex.org/W2148851125","https://openalex.org/W2013919567","https://openalex.org/W3154587653","https://openalex.org/W2316248136","https://openalex.org/W2368240274"],"abstract_inverted_index":{"The":[0,153],"burgconing":[1],"amount":[2],"of":[3,69,105,211,219,233,249,260],"textual":[4,76,92],"data":[5,133,220,256],"in":[6,14,90,149,158,194,243,262],"distributed":[7,25,39,91,132,151,179,199,253],"sources":[8],"combined":[9],"with":[10],"the":[11,21,33,57,66,106,174,198,202,217,231,234,238,250,258,263],"obstacles":[12],"involved":[13],"creating":[15],"and":[16,28,131,161],"maintaining":[17],"central":[18],"repositories":[19],"motivates":[20],"need":[22,34],"for":[23,116],"effective":[24],"information":[26,73,129,139,154],"extraction":[27,130,140],"mining":[29,182],"techniques.":[30],"Recently,":[31],"as":[32],"to":[35,142,167,186,229],"mine":[36],"patterns":[37],"across":[38,197],"databases":[40,58,70,160,200],"has":[41],"grown,":[42],"Distributed":[43,117],"Association":[44],"Rule":[45],"Mining":[46],"(D-ARM)":[47],"algorithms":[48,80],"have":[49],"been":[50],"developed.":[51],"These":[52],"algorithms,":[53,206],"however,":[54],"assume":[55],"that":[56,94,127,216],"are":[59,95,227],"either":[60],"horizontally":[61,99],"or":[62,223],"vertically":[63,97],"distributed.":[64],"In":[65,108],"special":[67],"case":[68],"populated":[71],"from":[72,75,146],"extracted":[74,155,175],"data,":[77],"existing":[78,205],"D-ARM":[79],"cannot":[81],"discover":[82,187],"rules":[83],"based":[84],"on":[85,173,252],"higher-order":[86,188],"associations":[87,189],"between":[88,190],"items":[89,191],"documents":[93],"neither":[96,209],"nor":[98,215],"distributed,":[100],"but":[101],"rather":[102],"a":[103,114,124,137,150,162,177,212],"hybrid":[104,125],"two.":[107],"this":[109],"article":[110],"we":[111],"present":[112],"D-HOTM,":[113],"framework":[115],"Higher":[118],"Order":[119],"Text":[120],"Mining.":[121],"D-HOTM":[122,207,261],"is":[123,156,165,184],"approach":[126],"combines":[128],"mining.":[134],"We":[135],"employ":[136],"novel":[138,178],"technique":[141],"extract":[143],"meaningful":[144],"entities":[145],"unstructured":[147],"text":[148],"environment.":[152],"stored":[157],"local":[159],"mapping":[163,235],"function":[164,236],"applied":[166,185],"identify":[168],"globally":[169],"unique":[170],"keys.":[171,203],"Based":[172],"information,":[176],"association":[180],"rule":[181],"algorithm":[183,251],"(i.e.,":[192],"entities)":[193],"records":[195],"fragmented":[196],"using":[201],"Unlike":[204],"requires":[208],"knowledge":[210],"global":[213],"schema":[214],"distribution":[218],"be":[221],"horizontal":[222],"vertical.":[224],"Evaluation":[225],"methods":[226],"proposed":[228],"incorporate":[230],"performance":[232],"into":[237],"traditional":[239],"support":[240],"metric":[241],"used":[242],"ARM":[244],"evaluation.":[245],"An":[246],"example":[247],"application":[248],"law":[254],"enforcement":[255],"demonstrates":[257],"relevance":[259],"fight":[264],"against":[265],"terrorism.":[266]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2019,"cited_by_count":3},{"year":2018,"cited_by_count":3},{"year":2016,"cited_by_count":1},{"year":2014,"cited_by_count":3},{"year":2013,"cited_by_count":3},{"year":2012,"cited_by_count":1}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
