{"id":"https://openalex.org/W2977726997","doi":"https://doi.org/10.5220/0008121102570264","title":"Knowledge Discovery from Log Data Analysis in a Multi-source Search System based on Deep Cleaning","display_name":"Knowledge Discovery from Log Data Analysis in a Multi-source Search System based on Deep Cleaning","publication_year":2019,"publication_date":"2019-01-01","ids":{"openalex":"https://openalex.org/W2977726997","doi":"https://doi.org/10.5220/0008121102570264","mag":"2977726997"},"language":"en","primary_location":{"id":"doi:10.5220/0008121102570264","is_oa":true,"landing_page_url":"https://doi.org/10.5220/0008121102570264","pdf_url":null,"source":null,"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 15th International Conference on Web Information Systems and Technologies","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.5220/0008121102570264","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5028548919","display_name":"Fatma Zohra Lebib","orcid":"https://orcid.org/0000-0002-1821-8097"},"institutions":[{"id":"https://openalex.org/I4210095777","display_name":"Centre de Recherche sur l'Information Scientifique et Technique","ror":"https://ror.org/01k1bte55","country_code":"DZ","type":"government","lineage":["https://openalex.org/I4210095777","https://openalex.org/I4210114810"]},{"id":"https://openalex.org/I157169809","display_name":"University of Sciences and Technology Houari Boumediene","ror":"https://ror.org/02kb89c09","country_code":"DZ","type":"education","lineage":["https://openalex.org/I157169809"]}],"countries":["DZ"],"is_corresponding":true,"raw_author_name":"Fatma Lebib","raw_affiliation_strings":["University of Science and Technology Houari Boumediene, USTHB, Algiers, Algeria, Research Center in Scientific and Technical Information, CERIST, Algiers and Algeria, --- Select a Country ---"],"affiliations":[{"raw_affiliation_string":"University of Science and Technology Houari Boumediene, USTHB, Algiers, Algeria, Research Center in Scientific and Technical Information, CERIST, Algiers and Algeria, --- Select a Country ---","institution_ids":["https://openalex.org/I157169809","https://openalex.org/I4210095777"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060801076","display_name":"Hakima Mellah","orcid":null},"institutions":[{"id":"https://openalex.org/I4210095777","display_name":"Centre de Recherche sur l'Information Scientifique et Technique","ror":"https://ror.org/01k1bte55","country_code":"DZ","type":"government","lineage":["https://openalex.org/I4210095777","https://openalex.org/I4210114810"]}],"countries":["DZ"],"is_corresponding":false,"raw_author_name":"Hakima Mellah","raw_affiliation_strings":["Research Center in Scientific and Technical Information, CERIST, Algiers and Algeria, --- Select a Country ---"],"affiliations":[{"raw_affiliation_string":"Research Center in Scientific and Technical Information, CERIST, Algiers and Algeria, --- Select a Country ---","institution_ids":["https://openalex.org/I4210095777"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5082266809","display_name":"Abdelkrim Meziane","orcid":"https://orcid.org/0000-0003-0894-8376"},"institutions":[{"id":"https://openalex.org/I4210095777","display_name":"Centre de Recherche sur l'Information Scientifique et Technique","ror":"https://ror.org/01k1bte55","country_code":"DZ","type":"government","lineage":["https://openalex.org/I4210095777","https://openalex.org/I4210114810"]}],"countries":["DZ"],"is_corresponding":false,"raw_author_name":"Abdelkrim Meziane","raw_affiliation_strings":["Research Center in Scientific and Technical Information, CERIST, Algiers and Algeria, --- Select a Country ---"],"affiliations":[{"raw_affiliation_string":"Research Center in Scientific and Technical Information, CERIST, Algiers and Algeria, --- Select a Country ---","institution_ids":["https://openalex.org/I4210095777"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5028548919"],"corresponding_institution_ids":["https://openalex.org/I157169809","https://openalex.org/I4210095777"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.16649841,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"257","last_page":"264"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.988099992275238,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.988099992275238,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9797999858856201,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12288","display_name":"Optimization and Search Problems","score":0.9793000221252441,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8409866094589233},{"id":"https://openalex.org/keywords/web-log-analysis-software","display_name":"Web log analysis software","score":0.6649097204208374},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.6048897504806519},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.5005383491516113},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.4796890914440155},{"id":"https://openalex.org/keywords/search-engine","display_name":"Search engine","score":0.45376598834991455},{"id":"https://openalex.org/keywords/web-page","display_name":"Web page","score":0.2760840058326721},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.25665658712387085},{"id":"https://openalex.org/keywords/web-navigation","display_name":"Web navigation","score":0.1553167998790741},{"id":"https://openalex.org/keywords/static-web-page","display_name":"Static web page","score":0.1015738844871521},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.0876537561416626}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8409866094589233},{"id":"https://openalex.org/C104352257","wikidata":"https://www.wikidata.org/wiki/Q1238961","display_name":"Web log analysis software","level":5,"score":0.6649097204208374},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.6048897504806519},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5005383491516113},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4796890914440155},{"id":"https://openalex.org/C97854310","wikidata":"https://www.wikidata.org/wiki/Q19541","display_name":"Search engine","level":2,"score":0.45376598834991455},{"id":"https://openalex.org/C21959979","wikidata":"https://www.wikidata.org/wiki/Q36774","display_name":"Web page","level":2,"score":0.2760840058326721},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.25665658712387085},{"id":"https://openalex.org/C61096286","wikidata":"https://www.wikidata.org/wiki/Q7978592","display_name":"Web navigation","level":3,"score":0.1553167998790741},{"id":"https://openalex.org/C173576120","wikidata":"https://www.wikidata.org/wiki/Q2641220","display_name":"Static web page","level":4,"score":0.1015738844871521},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0876537561416626}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.5220/0008121102570264","is_oa":true,"landing_page_url":"https://doi.org/10.5220/0008121102570264","pdf_url":null,"source":null,"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 15th International Conference on Web Information Systems and Technologies","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.5220/0008121102570264","is_oa":true,"landing_page_url":"https://doi.org/10.5220/0008121102570264","pdf_url":null,"source":null,"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 15th International Conference on Web Information Systems and Technologies","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2023370952","https://openalex.org/W167737004","https://openalex.org/W1964038241","https://openalex.org/W2185038817","https://openalex.org/W2385957133","https://openalex.org/W3590553","https://openalex.org/W2004064649","https://openalex.org/W3141094475","https://openalex.org/W1974306718","https://openalex.org/W2390285850"],"abstract_inverted_index":{"In":[0,128],"a":[1,63],"multi-source":[2,64],"search":[3,15,65],"system,":[4],"understanding":[5],"users\u2019":[6],"interests":[7],"and":[8,16,44,79,84,116,151,192],"behaviour":[9],"is":[10,75,158],"essential":[11],"to":[12,21,46,76,130,168,175],"improve":[13],"the":[14,18,29,59,68,81,100,105,117,131,140,162,177,197],"adapt":[17],"results":[19],"according":[20],"each":[22,200],"user":[23,50],"profile.":[24,51],"The":[25,73,92,180],"interesting":[26],"information":[27,190],"characterizing":[28],"users":[30,87],"can":[31,183],"be":[32,41,184],"hidden":[33],"in":[34],"large":[35],"log":[36,60,109,141],"files,":[37,148],"whereas":[38],"it":[39],"must":[40],"discovered,":[42],"extracted":[43],"analyzed":[45],"build":[47],"an":[48,55],"accurate":[49],"This":[52,173],"paper":[53],"presents":[54],"approach":[56,94],"which":[57,160],"analyzes":[58,161],"data":[61,107,123,138,182],"of":[62,86,96,146,153,165,199],"system":[66],"using":[67],"web":[69],"usage":[70],"mining":[71],"techniques.":[72],"aim":[74],"capture,":[77],"model":[78],"analyze":[80],"behavioural":[82],"patterns":[83],"profiles":[85],"interacting":[88],"with":[89],"this":[90],"system.":[91],"proposed":[93],"consists":[95],"two":[97],"major":[98],"steps,":[99],"first":[101],"step":[102,119],"\u201cpre-processing\u201d":[103],"eliminates":[104],"unwanted":[106,171],"from":[108,139],"files":[110],"based":[111],"on":[112,124],"predefined":[113],"cleaning":[114,133,157],"rules,":[115],"second":[118],"\u201cprocessing\u201d":[120],"extracts":[121],"useful":[122],"user\u2019s":[125],"previous":[126],"queries.":[127],"addition":[129],"conventional":[132],"process":[134],"that":[135],"removes":[136],"irrelevant":[137],"file,":[142],"such":[143],"as":[144],"access":[145],"multimedia":[147],"error":[149],"codes":[150],"accesses":[152],"Web":[154],"robots,":[155],"deep":[156],"proposed,":[159],"queries":[163],"structure":[164],"different":[166],"sources":[167,195],"further":[169],"eliminate":[170],"data.":[172],"allows":[174],"accelerate":[176],"processing":[178],"phase.":[179],"generated":[181],"used":[185],"for":[186,196],"personalizing":[187],"user-system":[188],"interaction,":[189],"filtering":[191],"recommending":[193],"appropriate":[194],"needs":[198],"user.":[201]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
