{"id":"https://openalex.org/W2146227473","doi":"https://doi.org/10.1155/2009/856037","title":"Profile-Based Focused Crawling for Social Media-Sharing Websites","display_name":"Profile-Based Focused Crawling for Social Media-Sharing Websites","publication_year":2009,"publication_date":"2009-01-01","ids":{"openalex":"https://openalex.org/W2146227473","doi":"https://doi.org/10.1155/2009/856037","mag":"2146227473"},"language":"en","primary_location":{"id":"doi:10.1155/2009/856037","is_oa":true,"landing_page_url":"https://doi.org/10.1155/2009/856037","pdf_url":null,"source":{"id":"https://openalex.org/S153767265","display_name":"EURASIP Journal on Image and Video Processing","issn_l":"1687-5176","issn":["1687-5176","1687-5281"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EURASIP Journal on Image and Video Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1155/2009/856037","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100352621","display_name":"Zhiyong Zhang","orcid":"https://orcid.org/0000-0003-3061-7768"},"institutions":[{"id":"https://openalex.org/I142740786","display_name":"University of Louisville","ror":"https://ror.org/01ckdn478","country_code":"US","type":"education","lineage":["https://openalex.org/I142740786"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Zhiyong Zhang","raw_affiliation_strings":["Department of Computer Engineering and Computer Sciences, University of Louisville, Louisville, KY"],"affiliations":[{"raw_affiliation_string":"Department of Computer Engineering and Computer Sciences, University of Louisville, Louisville, KY","institution_ids":["https://openalex.org/I142740786"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5049581991","display_name":"Olfa Nasraoui","orcid":"https://orcid.org/0000-0003-0999-5385"},"institutions":[{"id":"https://openalex.org/I142740786","display_name":"University of Louisville","ror":"https://ror.org/01ckdn478","country_code":"US","type":"education","lineage":["https://openalex.org/I142740786"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Olfa Nasraoui","raw_affiliation_strings":["Department of Computer Engineering and Computer Sciences, University of Louisville, Louisville, KY"],"affiliations":[{"raw_affiliation_string":"Department of Computer Engineering and Computer Sciences, University of Louisville, Louisville, KY","institution_ids":["https://openalex.org/I142740786"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5100352621"],"corresponding_institution_ids":["https://openalex.org/I142740786"],"apc_list":{"value":1140,"currency":"GBP","value_usd":1398},"apc_paid":{"value":1140,"currency":"GBP","value_usd":1398},"fwci":1.5557,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.8955058,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"2009","issue":null,"first_page":"1","last_page":"13"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11478","display_name":"Caching and Content Delivery","score":0.9829000234603882,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10742","display_name":"Peer-to-Peer Network Technologies","score":0.95660001039505,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/crawling","display_name":"Crawling","score":0.8297927379608154},{"id":"https://openalex.org/keywords/social-media","display_name":"Social media","score":0.7664831876754761},{"id":"https://openalex.org/keywords/biometrics","display_name":"Biometrics","score":0.6972235441207886},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.5412899851799011},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5394358038902283},{"id":"https://openalex.org/keywords/internet-privacy","display_name":"Internet privacy","score":0.38564690947532654},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.33514660596847534},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.26512932777404785},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.12128391861915588}],"concepts":[{"id":"https://openalex.org/C100368936","wikidata":"https://www.wikidata.org/wiki/Q1411725","display_name":"Crawling","level":2,"score":0.8297927379608154},{"id":"https://openalex.org/C518677369","wikidata":"https://www.wikidata.org/wiki/Q202833","display_name":"Social media","level":2,"score":0.7664831876754761},{"id":"https://openalex.org/C184297639","wikidata":"https://www.wikidata.org/wiki/Q177765","display_name":"Biometrics","level":2,"score":0.6972235441207886},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.5412899851799011},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5394358038902283},{"id":"https://openalex.org/C108827166","wikidata":"https://www.wikidata.org/wiki/Q175975","display_name":"Internet privacy","level":1,"score":0.38564690947532654},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.33514660596847534},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.26512932777404785},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.12128391861915588},{"id":"https://openalex.org/C105702510","wikidata":"https://www.wikidata.org/wiki/Q514","display_name":"Anatomy","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1155/2009/856037","is_oa":true,"landing_page_url":"https://doi.org/10.1155/2009/856037","pdf_url":null,"source":{"id":"https://openalex.org/S153767265","display_name":"EURASIP Journal on Image and Video Processing","issn_l":"1687-5176","issn":["1687-5176","1687-5281"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EURASIP Journal on Image and Video Processing","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:461d85cbd6ee4b4c978f74a0f268b3a4","is_oa":true,"landing_page_url":"https://doaj.org/article/461d85cbd6ee4b4c978f74a0f268b3a4","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"EURASIP Journal on Image and Video Processing, Vol 2009 (2009)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1155/2009/856037","is_oa":true,"landing_page_url":"https://doi.org/10.1155/2009/856037","pdf_url":null,"source":{"id":"https://openalex.org/S153767265","display_name":"EURASIP Journal on Image and Video Processing","issn_l":"1687-5176","issn":["1687-5176","1687-5281"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EURASIP Journal on Image and Video Processing","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":20,"referenced_works":["https://openalex.org/W1489992655","https://openalex.org/W1978047987","https://openalex.org/W2005579877","https://openalex.org/W2012575882","https://openalex.org/W2017224880","https://openalex.org/W2037600449","https://openalex.org/W2045986835","https://openalex.org/W2051833850","https://openalex.org/W2066309116","https://openalex.org/W2076008912","https://openalex.org/W2100612254","https://openalex.org/W2104086170","https://openalex.org/W2119577990","https://openalex.org/W2124673015","https://openalex.org/W2128915886","https://openalex.org/W2140077965","https://openalex.org/W2143309843","https://openalex.org/W2150721933","https://openalex.org/W2151007976","https://openalex.org/W2158601853"],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W4321258516","https://openalex.org/W2051833850","https://openalex.org/W4287845917","https://openalex.org/W3156164993","https://openalex.org/W2385015894","https://openalex.org/W2171573941","https://openalex.org/W4317382653","https://openalex.org/W3119324922","https://openalex.org/W2089702591"],"abstract_inverted_index":{"We":[0],"present":[1],"a":[2,36,70,92,149,173],"novel":[3],"profile-based":[4,167],"focused":[5,90,168],"crawling":[6,31,68,190],"system":[7],"for":[8,28,76,88,101,120,152,194],"dealing":[9],"with":[10],"the":[11,22,30,48,59,67,89,113,138,163,191],"increasingly":[12],"popular":[13],"social":[14,61,77],"media-sharing":[15,78],"websites.":[16,79],"In":[17,63,80],"this":[18],"system,":[19],"we":[20,34,124],"treat":[21],"user":[23],"profiles":[24],"as":[25,170,172],"ranking":[26,151],"criteria":[27],"guiding":[29],"process.":[32],"Furthermore,":[33],"divide":[35],"user&#x00027;s":[37,49,60],"profile":[38,108],"into":[39],"two":[40,195],"parts,":[41],"an":[42,53],"internal":[43],"part,":[44,55],"which":[45,56],"comes":[46,57],"from":[47,58,141],"own":[50],"contribution,":[51],"and":[52,84,107,131,146,182],"external":[54],"contacts.":[62],"order":[64,81,135],"to":[65,82,126,136,180],"expand":[66],"topic,":[69],"cotagging":[71],"topic-discovery":[72],"scheme":[73],"was":[74],"adopted":[75],"efficiently":[83],"effectively":[85],"extract":[86,137],"data":[87],"crawling,":[91,122],"path":[93],"string-based":[94],"page":[95,117,184],"classification":[96],"method":[97],"is":[98,118,156],"first":[99],"developed":[100],"identifying":[102],"list":[103],"pages,":[104,106],"detail":[105,132],"pages.":[109],"The":[110],"identification":[111],"of":[112,116,144,165],"correct":[114,139],"type":[115,143],"essential":[119],"our":[121,166],"since":[123],"want":[125],"distinguish":[127],"between":[128],"list,":[129],"profile,":[130],"pages":[133],"in":[134,176],"information":[140],"each":[142,153],"page,":[145],"subsequently":[147],"estimate":[148],"reasonable":[150],"link":[154],"that":[155],"encountered":[157],"while":[158],"crawling.":[159],"Our":[160],"experiments":[161],"prove":[162],"robustness":[164],"crawler,":[169],"well":[171],"significant":[174],"improvement":[175],"harvest":[177],"ratio,":[178],"compared":[179],"breadth-first":[181],"online":[183],"importance":[185],"computation":[186],"(OPIC)":[187],"crawlers,":[188],"when":[189],"Flickr":[192],"website":[193],"different":[196],"topics.":[197]},"counts_by_year":[{"year":2021,"cited_by_count":1},{"year":2013,"cited_by_count":1}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
