{"id":"https://openalex.org/W4231751361","doi":"https://doi.org/10.1504/ijdats.2016.10002351","title":"Web informative content identification and filtering using machine learning technique","display_name":"Web informative content identification and filtering using machine learning technique","publication_year":2016,"publication_date":"2016-01-01","ids":{"openalex":"https://openalex.org/W4231751361","doi":"https://doi.org/10.1504/ijdats.2016.10002351"},"language":"en","primary_location":{"id":"doi:10.1504/ijdats.2016.10002351","is_oa":false,"landing_page_url":"https://doi.org/10.1504/ijdats.2016.10002351","pdf_url":null,"source":{"id":"https://openalex.org/S118326976","display_name":"International Journal of Data Analysis Techniques and Strategies","issn_l":"1755-8050","issn":["1755-8050","1755-8069"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310317825","host_organization_name":"Inderscience Publishers","host_organization_lineage":["https://openalex.org/P4310317825"],"host_organization_lineage_names":["Inderscience Publishers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Data Analysis Techniques and Strategies","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100655143","display_name":"Sanjay Kumar Sharma","orcid":"https://orcid.org/0000-0002-2546-8262"},"institutions":[{"id":"https://openalex.org/I102117144","display_name":"Banasthali University","ror":"https://ror.org/05ycegt40","country_code":"IN","type":"education","lineage":["https://openalex.org/I102117144"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Sanjay Kumar Sharma","raw_affiliation_strings":["Department of Computer Science, Banasthali University, Rajasthan, 304022, India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Banasthali University, Rajasthan, 304022, India","institution_ids":["https://openalex.org/I102117144"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5056945678","display_name":"Neetu Narwal","orcid":"https://orcid.org/0000-0003-1088-1385"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Neetu Narwal","raw_affiliation_strings":["Maharaja Surajmal Institute, C-4, Janakpuri, New Delhi, 110054, India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Maharaja Surajmal Institute, C-4, Janakpuri, New Delhi, 110054, India","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.5547552,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"8","issue":"4","first_page":"332","last_page":"332"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.977400004863739,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.977400004863739,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8284124135971069},{"id":"https://openalex.org/keywords/web-page","display_name":"Web page","score":0.788373589515686},{"id":"https://openalex.org/keywords/web-content","display_name":"Web content","score":0.4649803340435028},{"id":"https://openalex.org/keywords/parsing","display_name":"Parsing","score":0.45406386256217957},{"id":"https://openalex.org/keywords/the-internet","display_name":"The Internet","score":0.44613486528396606},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4344802796840668},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.4187923073768616},{"id":"https://openalex.org/keywords/page-view","display_name":"Page view","score":0.4150409996509552},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4134017825126648},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3756266236305237},{"id":"https://openalex.org/keywords/static-web-page","display_name":"Static web page","score":0.334075391292572},{"id":"https://openalex.org/keywords/web-navigation","display_name":"Web navigation","score":0.3104979693889618},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.29123613238334656}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8284124135971069},{"id":"https://openalex.org/C21959979","wikidata":"https://www.wikidata.org/wiki/Q36774","display_name":"Web page","level":2,"score":0.788373589515686},{"id":"https://openalex.org/C2776324614","wikidata":"https://www.wikidata.org/wiki/Q3948731","display_name":"Web content","level":3,"score":0.4649803340435028},{"id":"https://openalex.org/C186644900","wikidata":"https://www.wikidata.org/wiki/Q194152","display_name":"Parsing","level":2,"score":0.45406386256217957},{"id":"https://openalex.org/C110875604","wikidata":"https://www.wikidata.org/wiki/Q75","display_name":"The Internet","level":2,"score":0.44613486528396606},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4344802796840668},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4187923073768616},{"id":"https://openalex.org/C103645729","wikidata":"https://www.wikidata.org/wiki/Q911187","display_name":"Page view","level":5,"score":0.4150409996509552},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4134017825126648},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3756266236305237},{"id":"https://openalex.org/C173576120","wikidata":"https://www.wikidata.org/wiki/Q2641220","display_name":"Static web page","level":4,"score":0.334075391292572},{"id":"https://openalex.org/C61096286","wikidata":"https://www.wikidata.org/wiki/Q7978592","display_name":"Web navigation","level":3,"score":0.3104979693889618},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.29123613238334656}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1504/ijdats.2016.10002351","is_oa":false,"landing_page_url":"https://doi.org/10.1504/ijdats.2016.10002351","pdf_url":null,"source":{"id":"https://openalex.org/S118326976","display_name":"International Journal of Data Analysis Techniques and Strategies","issn_l":"1755-8050","issn":["1755-8050","1755-8069"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310317825","host_organization_name":"Inderscience Publishers","host_organization_lineage":["https://openalex.org/P4310317825"],"host_organization_lineage_names":["Inderscience Publishers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Data Analysis Techniques and Strategies","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","score":0.7099999785423279,"display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W1979144454","https://openalex.org/W2552270810","https://openalex.org/W2055154498","https://openalex.org/W2045069236","https://openalex.org/W2051097555","https://openalex.org/W4230700435","https://openalex.org/W2087758976","https://openalex.org/W2492611973","https://openalex.org/W2074126298","https://openalex.org/W4237105987"],"abstract_inverted_index":{"Internet":[0],"has":[1,10],"gained":[2],"greatest":[3],"acceptance":[4],"as":[5],"reservoirs":[6],"of":[7,22,81,145,154],"information.":[8],"It":[9],"been":[11,118],"observed":[12],"that":[13,162],"the":[14,38,47,64,68,79,82,87,94,105,113,135,146,152,157,163],"web":[15,39,69,83,88,95,147],"page":[16,40,70,89,96],"along":[17],"with":[18],"main":[19,142],"content":[20,66,80,143],"comprises":[21],"noise":[23],"(advertisement,":[24],"external":[25,167],"links),":[26],"which":[27,62],"poses":[28],"difficulty":[29],"for":[30,92,172],"various":[31],"search":[32],"engines":[33],"crawlers":[34],"to":[35,46,75,97,111,131,140],"correctly":[36],"classify":[37],"and":[41,71,77,102,160],"it":[42],"also":[43,150],"provides":[44],"distraction":[45],"user":[48],"interested":[49],"in":[50],"gathering":[51],"relevant":[52,65],"data.":[53],"In":[54],"this":[55,73],"paper,":[56],"we":[57],"proposed":[58],"a":[59],"novel":[60],"approach":[61],"categorises":[63],"from":[67,107,166],"use":[72],"information":[74],"filter":[76],"rearrange":[78],"page.":[84,148],"We":[85,149],"used":[86,139],"segmentation":[90],"algorithm":[91],"parsing":[93],"obtain":[98],"non-overlapping":[99],"visual":[100,109],"blocks":[101,110],"then":[103],"extracted":[104],"features":[106,155],"these":[108],"build":[112],"dataset.":[114],"The":[115],"dataset":[116],"have":[117,169],"trained":[119],"using":[120],"popular":[121],"machine":[122],"learning":[123,158],"classifier":[124],"techniques":[125],"(neural":[126],"network,":[127],"RBF":[128],"neural":[129],"network)":[130],"discriminate":[132],"content.":[133],"Finally,":[134],"classification":[136],"output":[137],"is":[138],"perform":[141],"filtering":[144],"analysed":[151],"importance":[153],"on":[156],"process":[159],"perceive":[161],"embedded":[164],"objects":[165],"source":[168],"highest":[170],"significance":[171],"block":[173],"identification.":[174]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
