{"id":"https://openalex.org/W2014597988","doi":"https://doi.org/10.1145/2505515.2505762","title":"Searching similar segments over textual event sequences","display_name":"Searching similar segments over textual event sequences","publication_year":2013,"publication_date":"2013-10-27","ids":{"openalex":"https://openalex.org/W2014597988","doi":"https://doi.org/10.1145/2505515.2505762","mag":"2014597988"},"language":"en","primary_location":{"id":"doi:10.1145/2505515.2505762","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2505515.2505762","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 22nd ACM international conference on Information &amp; Knowledge Management","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100723083","display_name":"Liang Tang","orcid":"https://orcid.org/0000-0001-6977-6534"},"institutions":[{"id":"https://openalex.org/I19700959","display_name":"Florida International University","ror":"https://ror.org/02gz6gg07","country_code":"US","type":"education","lineage":["https://openalex.org/I19700959"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Liang Tang","raw_affiliation_strings":["Florida International University, Miami, FL, USA"],"affiliations":[{"raw_affiliation_string":"Florida International University, Miami, FL, USA","institution_ids":["https://openalex.org/I19700959"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100455259","display_name":"Tao Li","orcid":"https://orcid.org/0000-0001-9277-1539"},"institutions":[{"id":"https://openalex.org/I19700959","display_name":"Florida International University","ror":"https://ror.org/02gz6gg07","country_code":"US","type":"education","lineage":["https://openalex.org/I19700959"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Tao Li","raw_affiliation_strings":["Florida International University, Miami, FL, USA"],"affiliations":[{"raw_affiliation_string":"Florida International University, Miami, FL, USA","institution_ids":["https://openalex.org/I19700959"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049219173","display_name":"Shu\u2010Ching Chen","orcid":"https://orcid.org/0000-0001-9209-390X"},"institutions":[{"id":"https://openalex.org/I19700959","display_name":"Florida International University","ror":"https://ror.org/02gz6gg07","country_code":"US","type":"education","lineage":["https://openalex.org/I19700959"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Shu-Ching Chen","raw_affiliation_strings":["Florida International University, Miami, FL, USA"],"affiliations":[{"raw_affiliation_string":"Florida International University, Miami, FL, USA","institution_ids":["https://openalex.org/I19700959"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101942006","display_name":"Shunzhi Zhu","orcid":"https://orcid.org/0000-0001-8321-1169"},"institutions":[{"id":"https://openalex.org/I75867142","display_name":"Xiamen University of Technology","ror":"https://ror.org/01285e189","country_code":"CN","type":"education","lineage":["https://openalex.org/I75867142"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shunzhi Zhu","raw_affiliation_strings":["Xiamen University of Technology, Xiamen, China","Xiamen University of Technology, Xiamen, CHINA"],"affiliations":[{"raw_affiliation_string":"Xiamen University of Technology, Xiamen, China","institution_ids":["https://openalex.org/I75867142"]},{"raw_affiliation_string":"Xiamen University of Technology, Xiamen, CHINA","institution_ids":["https://openalex.org/I75867142"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5100723083"],"corresponding_institution_ids":["https://openalex.org/I19700959"],"apc_list":null,"apc_paid":null,"fwci":0.4942,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.75875668,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"329","last_page":"338"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.994700014591217,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9940999746322632,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/substring","display_name":"Substring","score":0.8731602430343628},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7688485980033875},{"id":"https://openalex.org/keywords/event","display_name":"Event (particle physics)","score":0.7175168395042419},{"id":"https://openalex.org/keywords/suffix-array","display_name":"Suffix array","score":0.634458601474762},{"id":"https://openalex.org/keywords/search-engine-indexing","display_name":"Search engine indexing","score":0.6104752421379089},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.5985603928565979},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.4931935667991638},{"id":"https://openalex.org/keywords/string-searching-algorithm","display_name":"String searching algorithm","score":0.48895370960235596},{"id":"https://openalex.org/keywords/pattern-matching","display_name":"Pattern matching","score":0.48793837428092957},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.4836758077144623},{"id":"https://openalex.org/keywords/suffix","display_name":"Suffix","score":0.4642186164855957},{"id":"https://openalex.org/keywords/hash-function","display_name":"Hash function","score":0.4606170356273651},{"id":"https://openalex.org/keywords/locality-sensitive-hashing","display_name":"Locality-sensitive hashing","score":0.4544830322265625},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4320666790008545},{"id":"https://openalex.org/keywords/data-structure","display_name":"Data structure","score":0.3819286823272705},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.3785867393016815},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3172927796840668},{"id":"https://openalex.org/keywords/hash-table","display_name":"Hash table","score":0.2634729743003845},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.13477149605751038},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.09515205025672913}],"concepts":[{"id":"https://openalex.org/C182407805","wikidata":"https://www.wikidata.org/wiki/Q2626534","display_name":"Substring","level":3,"score":0.8731602430343628},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7688485980033875},{"id":"https://openalex.org/C2779662365","wikidata":"https://www.wikidata.org/wiki/Q5416694","display_name":"Event (particle physics)","level":2,"score":0.7175168395042419},{"id":"https://openalex.org/C2779259728","wikidata":"https://www.wikidata.org/wiki/Q281472","display_name":"Suffix array","level":3,"score":0.634458601474762},{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.6104752421379089},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.5985603928565979},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.4931935667991638},{"id":"https://openalex.org/C7757238","wikidata":"https://www.wikidata.org/wiki/Q374040","display_name":"String searching algorithm","level":3,"score":0.48895370960235596},{"id":"https://openalex.org/C68859911","wikidata":"https://www.wikidata.org/wiki/Q1503724","display_name":"Pattern matching","level":2,"score":0.48793837428092957},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.4836758077144623},{"id":"https://openalex.org/C2779804580","wikidata":"https://www.wikidata.org/wiki/Q102047","display_name":"Suffix","level":2,"score":0.4642186164855957},{"id":"https://openalex.org/C99138194","wikidata":"https://www.wikidata.org/wiki/Q183427","display_name":"Hash function","level":2,"score":0.4606170356273651},{"id":"https://openalex.org/C74270461","wikidata":"https://www.wikidata.org/wiki/Q1625299","display_name":"Locality-sensitive hashing","level":4,"score":0.4544830322265625},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4320666790008545},{"id":"https://openalex.org/C162319229","wikidata":"https://www.wikidata.org/wiki/Q175263","display_name":"Data structure","level":2,"score":0.3819286823272705},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3785867393016815},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3172927796840668},{"id":"https://openalex.org/C67388219","wikidata":"https://www.wikidata.org/wiki/Q207440","display_name":"Hash table","level":3,"score":0.2634729743003845},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.13477149605751038},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.09515205025672913},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/2505515.2505762","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2505515.2505762","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 22nd ACM international conference on Information &amp; Knowledge Management","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.648.4721","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.648.4721","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://users.cis.fiu.edu/~chens/PDF/cikm2013.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":34,"referenced_works":["https://openalex.org/W164902916","https://openalex.org/W1502916507","https://openalex.org/W1565377632","https://openalex.org/W1831068561","https://openalex.org/W1938740620","https://openalex.org/W1956559956","https://openalex.org/W1979464422","https://openalex.org/W1988338552","https://openalex.org/W1991800036","https://openalex.org/W2019076926","https://openalex.org/W2021809202","https://openalex.org/W2055043387","https://openalex.org/W2081193615","https://openalex.org/W2100169722","https://openalex.org/W2104001127","https://openalex.org/W2112099725","https://openalex.org/W2115056012","https://openalex.org/W2118269922","https://openalex.org/W2118703123","https://openalex.org/W2124985265","https://openalex.org/W2136159049","https://openalex.org/W2138087993","https://openalex.org/W2145065594","https://openalex.org/W2145725688","https://openalex.org/W2148356029","https://openalex.org/W2148781362","https://openalex.org/W2152565070","https://openalex.org/W2153470728","https://openalex.org/W2158874082","https://openalex.org/W2161449253","https://openalex.org/W2161488606","https://openalex.org/W2169953282","https://openalex.org/W2170899819","https://openalex.org/W2533248932"],"related_works":["https://openalex.org/W2902482624","https://openalex.org/W2902555313","https://openalex.org/W2376315482","https://openalex.org/W4249054680","https://openalex.org/W3112977702","https://openalex.org/W2218650848","https://openalex.org/W2366227422","https://openalex.org/W1993281991","https://openalex.org/W3022344494","https://openalex.org/W2355168454"],"abstract_inverted_index":{"Sequential":[0],"data":[1,28,32,110,227],"is":[2,34,50,68,180],"prevalent":[3],"in":[4,29,92,200],"many":[5],"scientific":[6],"and":[7,15,25,65,166,228],"commercial":[8],"applications":[9],"such":[10],"as":[11],"bioinformatics,":[12],"system":[13,58,74,90,99,103,225],"security":[14],"networking.":[16],"Similarity":[17],"search":[18,106,218],"has":[19,184],"been":[20],"widely":[21],"studied":[22],"for":[23,98,108,147],"symbolic":[24],"time":[26],"series":[27],"which":[30,95],"each":[31,48,66],"object":[33,49],"a":[35,51,69,127,143,181,207],"symbol":[36],"or":[37,79],"numeric":[38],"value.":[39],"Textual":[40],"event":[41,63,67,86,154],"sequences":[42,44,64,131],"are":[43,60,96,119,132],"of":[45,84,160],"events,":[46],"where":[47],"message":[52,71],"describing":[53],"an":[54,85,158],"event.":[55],"For":[56],"example,":[57],"logs":[59],"typical":[61],"textual":[62,70,109,153],"recording":[72],"internal":[73],"operations,":[75],"statuses,":[76],"configuration":[77],"modifications":[78],"execution":[80],"errors.":[81],"Similar":[82],"segments":[83,125,151,214],"sequence":[87,197],"reveals":[88],"similar":[89,150],"behaviors":[91],"the":[93,173,191,229],"past":[94],"helpful":[97],"administrators":[100],"to":[101,121,190,210],"diagnose":[102],"problems.":[104],"Existing":[105],"indexing":[107],"only":[111],"focus":[112],"on":[113,223],"unordered":[114],"data.":[115],"Substring":[116],"matching":[117],"methods":[118,239],"able":[120],"efficiently":[122,148],"find":[123],"matched":[124],"over":[126,152],"sequence,":[128],"however,":[129],"their":[130],"single":[133],"values":[134],"rather":[135],"than":[136],"texts.":[137],"In":[138],"this":[139,201,203],"paper,":[140,202],"we":[141],"propose":[142],"method,":[144],"suffix":[145,167],"matrix,":[146],"searching":[149],"sequences.":[155],"It":[156],"provides":[157],"integration":[159],"two":[161],"disparate":[162],"techniques:":[163],"locality-sensitive":[164],"hashing":[165],"arrays.":[168],"This":[169],"method":[170,204,236],"also":[171],"supports":[172],"k-dissimilar":[174,178,213],"segment":[175,179,182],"search.":[176],"A":[177],"that":[183,233],"at":[185],"most":[186],"k":[187],"dissimilar":[188],"events":[189],"query":[192],"sequence.":[193],"By":[194],"using":[195,240],"random":[196],"mask":[198],"proposed":[199,235],"can":[205],"have":[206],"high":[208],"probability":[209],"reach":[211],"all":[212],"without":[215],"increasing":[216],"much":[217],"cost.":[219],"We":[220],"conduct":[221],"experiments":[222],"real":[224],"log":[226],"experimental":[230],"results":[231],"show":[232],"our":[234],"outperforms":[237],"alternative":[238],"existing":[241],"techniques.":[242]},"counts_by_year":[{"year":2014,"cited_by_count":1}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
