{"id":"https://openalex.org/W4224442743","doi":"https://doi.org/10.3233/ida-205107","title":"Online learning agents for cost-sensitive topical data acquisition from the web","display_name":"Online learning agents for cost-sensitive topical data acquisition from the web","publication_year":2022,"publication_date":"2022-04-18","ids":{"openalex":"https://openalex.org/W4224442743","doi":"https://doi.org/10.3233/ida-205107"},"language":"en","primary_location":{"id":"doi:10.3233/ida-205107","is_oa":false,"landing_page_url":"https://doi.org/10.3233/ida-205107","pdf_url":null,"source":{"id":"https://openalex.org/S2498839158","display_name":"Intelligent Data Analysis","issn_l":"1088-467X","issn":["1088-467X","1571-4128"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310318577","host_organization_name":"IOS Press","host_organization_lineage":["https://openalex.org/P4310318577"],"host_organization_lineage_names":["IOS Press"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Intelligent Data Analysis","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5021247287","display_name":"Mahdi Naghibi","orcid":null},"institutions":[{"id":"https://openalex.org/I78323350","display_name":"Malek Ashtar University of Technology","ror":"https://ror.org/0043ezw98","country_code":"IR","type":"education","lineage":["https://openalex.org/I78323350"]}],"countries":["IR"],"is_corresponding":true,"raw_author_name":"Mahdi Naghibi","raw_affiliation_strings":["Faculty of Electrical and Computer Engineering, Malek-Ashtar University of Technology, Iran"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Electrical and Computer Engineering, Malek-Ashtar University of Technology, Iran","institution_ids":["https://openalex.org/I78323350"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000198628","display_name":"Reza Anvari","orcid":null},"institutions":[{"id":"https://openalex.org/I78323350","display_name":"Malek Ashtar University of Technology","ror":"https://ror.org/0043ezw98","country_code":"IR","type":"education","lineage":["https://openalex.org/I78323350"]}],"countries":["IR"],"is_corresponding":false,"raw_author_name":"Reza Anvari","raw_affiliation_strings":["Faculty of Electrical and Computer Engineering, Malek-Ashtar University of Technology, Iran"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Electrical and Computer Engineering, Malek-Ashtar University of Technology, Iran","institution_ids":["https://openalex.org/I78323350"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031513984","display_name":"Ali Forghani","orcid":"https://orcid.org/0000-0002-1628-7718"},"institutions":[{"id":"https://openalex.org/I78323350","display_name":"Malek Ashtar University of Technology","ror":"https://ror.org/0043ezw98","country_code":"IR","type":"education","lineage":["https://openalex.org/I78323350"]}],"countries":["IR"],"is_corresponding":false,"raw_author_name":"Ali Forghani","raw_affiliation_strings":["Faculty of Electrical and Computer Engineering, Malek-Ashtar University of Technology, Iran"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Electrical and Computer Engineering, Malek-Ashtar University of Technology, Iran","institution_ids":["https://openalex.org/I78323350"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5057087345","display_name":"Behrouz Minaei\u2010Bidgoli","orcid":"https://orcid.org/0000-0002-9327-7345"},"institutions":[{"id":"https://openalex.org/I67009956","display_name":"Iran University of Science and Technology","ror":"https://ror.org/01jw2p796","country_code":"IR","type":"education","lineage":["https://openalex.org/I67009956"]}],"countries":["IR"],"is_corresponding":false,"raw_author_name":"Behrouz Minaei","raw_affiliation_strings":["Department of Computer Engineering, Iran University of Science and Technology, Iran","E-mail:","Fax: +98 21 22935341"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Engineering, Iran University of Science and Technology, Iran","institution_ids":["https://openalex.org/I67009956"]},{"raw_affiliation_string":"E-mail:","institution_ids":[]},{"raw_affiliation_string":"Fax: +98 21 22935341","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5021247287"],"corresponding_institution_ids":["https://openalex.org/I78323350"],"apc_list":null,"apc_paid":null,"fwci":0.6372,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.72270289,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":95},"biblio":{"volume":"26","issue":"3","first_page":"695","last_page":"722"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9771000146865845,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11478","display_name":"Caching and Content Delivery","score":0.9532999992370605,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8294017314910889},{"id":"https://openalex.org/keywords/crawling","display_name":"Crawling","score":0.7941474914550781},{"id":"https://openalex.org/keywords/web-crawler","display_name":"Web crawler","score":0.699384331703186},{"id":"https://openalex.org/keywords/inefficiency","display_name":"Inefficiency","score":0.6413995623588562},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.49298474192619324},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.45837026834487915},{"id":"https://openalex.org/keywords/web-page","display_name":"Web page","score":0.4378063678741455},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4365730285644531},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4315893352031708},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.4156107008457184},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.35226207971572876}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8294017314910889},{"id":"https://openalex.org/C100368936","wikidata":"https://www.wikidata.org/wiki/Q1411725","display_name":"Crawling","level":2,"score":0.7941474914550781},{"id":"https://openalex.org/C13743948","wikidata":"https://www.wikidata.org/wiki/Q45842","display_name":"Web crawler","level":2,"score":0.699384331703186},{"id":"https://openalex.org/C2778869765","wikidata":"https://www.wikidata.org/wiki/Q6028363","display_name":"Inefficiency","level":2,"score":0.6413995623588562},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.49298474192619324},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.45837026834487915},{"id":"https://openalex.org/C21959979","wikidata":"https://www.wikidata.org/wiki/Q36774","display_name":"Web page","level":2,"score":0.4378063678741455},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4365730285644531},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4315893352031708},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4156107008457184},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.35226207971572876},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C105702510","wikidata":"https://www.wikidata.org/wiki/Q514","display_name":"Anatomy","level":1,"score":0.0},{"id":"https://openalex.org/C175444787","wikidata":"https://www.wikidata.org/wiki/Q39072","display_name":"Microeconomics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.3233/ida-205107","is_oa":false,"landing_page_url":"https://doi.org/10.3233/ida-205107","pdf_url":null,"source":{"id":"https://openalex.org/S2498839158","display_name":"Intelligent Data Analysis","issn_l":"1088-467X","issn":["1088-467X","1571-4128"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310318577","host_organization_name":"IOS Press","host_organization_lineage":["https://openalex.org/P4310318577"],"host_organization_lineage_names":["IOS Press"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Intelligent Data Analysis","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":43,"referenced_works":["https://openalex.org/W1638427","https://openalex.org/W1489992655","https://openalex.org/W1503924817","https://openalex.org/W1963959122","https://openalex.org/W1974000536","https://openalex.org/W1978047987","https://openalex.org/W2001832505","https://openalex.org/W2001834587","https://openalex.org/W2005579877","https://openalex.org/W2017224880","https://openalex.org/W2030035054","https://openalex.org/W2044743392","https://openalex.org/W2045998703","https://openalex.org/W2098162425","https://openalex.org/W2102942431","https://openalex.org/W2107585977","https://openalex.org/W2116224704","https://openalex.org/W2133990480","https://openalex.org/W2140204390","https://openalex.org/W2145955964","https://openalex.org/W2151007976","https://openalex.org/W2151809999","https://openalex.org/W2157316480","https://openalex.org/W2160231803","https://openalex.org/W2165612380","https://openalex.org/W2567850235","https://openalex.org/W2568920572","https://openalex.org/W2571327869","https://openalex.org/W2611540330","https://openalex.org/W2748812704","https://openalex.org/W2771401735","https://openalex.org/W2798451772","https://openalex.org/W2803480040","https://openalex.org/W2894382219","https://openalex.org/W2948236829","https://openalex.org/W2949054060","https://openalex.org/W2963942219","https://openalex.org/W4206649294","https://openalex.org/W4235996464","https://openalex.org/W4236362309","https://openalex.org/W4236503510","https://openalex.org/W6600855501","https://openalex.org/W6731125637"],"related_works":["https://openalex.org/W1506122440","https://openalex.org/W2120136770","https://openalex.org/W1673346501","https://openalex.org/W2042201515","https://openalex.org/W2783570127","https://openalex.org/W2161927007","https://openalex.org/W3216588747","https://openalex.org/W2051135816","https://openalex.org/W2548298479","https://openalex.org/W4300913644"],"abstract_inverted_index":{"Access":[0],"to":[1,73,76],"one":[2],"of":[3,79,86,95,98,115,119,126,138,143,153,171,176,181,200,206,213],"the":[4,9,11,35,46,53,70,77,83,87,107,110,113,117,124,131,136,139,144,159,165,169,172,197,204,211,214],"richest":[5],"data":[6,27,43],"sources":[7],"in":[8,26,112,130,164,187],"world,":[10],"web,":[12],"is":[13,21,147],"not":[14,22],"possible":[15],"without":[16],"cost.":[17,55],"Often,":[18],"this":[19,31],"cost":[20],"taken":[23],"into":[24],"account":[25],"acquisition":[28,44],"processes.":[29],"In":[30],"paper,":[32],"we":[33],"introduce":[34],"Learning":[36],"Agents":[37],"(LA)":[38],"method":[39,59,146],"for":[40,102,122,157,179],"automatic":[41],"topical":[42,63,154,207],"from":[45],"web":[47,80],"with":[48],"minimum":[49],"bandwidth":[50],"usage":[51],"and":[52,90,134,209],"lowest":[54],"The":[56,65,161],"proposed":[57],"LA":[58,71,108,145,167,201],"uses":[60,150],"online":[61,66],"learning":[62,67,162,198],"crawlers.":[64,140],"capability":[68,199],"makes":[69],"able":[72],"dynamically":[74],"adapt":[75],"properties":[78],"pages":[81,180],"during":[82],"crawling":[84],"process":[85],"target":[88],"topic,":[89],"learn":[91],"an":[92],"effective":[93],"combination":[94],"a":[96,128,151],"set":[97],"link":[99,177],"scoring":[100,158],"criteria":[101,121],"that":[103,149,191],"topic.":[104],"That":[105],"way,":[106],"resolves":[109,168],"challenge":[111,170],"mechanism":[114],"combining":[116],"outputs":[118],"different":[120,182],"computing":[123],"value":[125],"following":[127],"link,":[129],"formerly":[132],"approaches,":[133],"increases":[135,203],"efficiency":[137,205],"A":[141],"version":[142],"implemented":[148,166],"collection":[152],"content":[155],"analyzers":[156],"links.":[160],"ability":[163],"unclear":[173],"appropriate":[174],"size":[175],"contexts":[178],"topics.":[183],"Using":[184],"standard":[185],"metrics":[186],"empirical":[188],"evaluation":[189],"indicates":[190],"when":[192],"non-learning":[193],"methods":[194],"show":[195],"inefficiency,":[196],"significantly":[202],"crawling,":[208],"achieves":[210],"state":[212],"art":[215],"results.":[216]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1}],"updated_date":"2026-05-21T06:26:12.895304","created_date":"2025-10-10T00:00:00"}
