{"id":"https://openalex.org/W4241034228","doi":"https://doi.org/10.1109/icws.2004.1314749","title":"Web services for information extraction from the Web","display_name":"Web services for information extraction from the Web","publication_year":2004,"publication_date":"2004-01-01","ids":{"openalex":"https://openalex.org/W4241034228","doi":"https://doi.org/10.1109/icws.2004.1314749"},"language":"en","primary_location":{"id":"doi:10.1109/icws.2004.1314749","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icws.2004.1314749","pdf_url":null,"source":{"id":"https://openalex.org/S4363608934","display_name":"Proceedings. IEEE International Conference on Web Services, 2004.","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings. IEEE International Conference on Web Services, 2004.","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5019037855","display_name":"B. Habegger","orcid":null},"institutions":[{"id":"https://openalex.org/I4210165258","display_name":"Laboratoire d'informatique de Nantes Atlantique","ror":"https://ror.org/05487pd16","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1326498283","https://openalex.org/I205703379","https://openalex.org/I4210127572","https://openalex.org/I4210159245","https://openalex.org/I4210165258","https://openalex.org/I97188460"]},{"id":"https://openalex.org/I97188460","display_name":"Nantes Universit\u00e9","ror":"https://ror.org/03gnr7b55","country_code":"FR","type":"education","lineage":["https://openalex.org/I97188460"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"B. Habegger","raw_affiliation_strings":["Laboratiore dInformatique de Nantes Atlantique, University of Nantes, Nantes, France"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Laboratiore dInformatique de Nantes Atlantique, University of Nantes, Nantes, France","institution_ids":["https://openalex.org/I4210165258","https://openalex.org/I97188460"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5022771618","display_name":"M. Quafafou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"M. Quafafou","raw_affiliation_strings":["Institut des Application Avanc\u00e9es de Internet, Marseilles, France"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institut des Application Avanc\u00e9es de Internet, Marseilles, France","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.53703704,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"17","issue":null,"first_page":"279","last_page":"286"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10679","display_name":"Service-Oriented Architecture and Web Services","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10679","display_name":"Service-Oriented Architecture and Web Services","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9923999905586243,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12601","display_name":"Web Applications and Data Management","score":0.9832000136375427,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8779193758964539},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.7106871008872986},{"id":"https://openalex.org/keywords/web-service","display_name":"Web service","score":0.6992048621177673},{"id":"https://openalex.org/keywords/web-modeling","display_name":"Web modeling","score":0.6645928025245667},{"id":"https://openalex.org/keywords/web-page","display_name":"Web page","score":0.6360929012298584},{"id":"https://openalex.org/keywords/static-web-page","display_name":"Static web page","score":0.6112263202667236},{"id":"https://openalex.org/keywords/mashup","display_name":"Mashup","score":0.5889759063720703},{"id":"https://openalex.org/keywords/data-web","display_name":"Data Web","score":0.5796562433242798},{"id":"https://openalex.org/keywords/web-navigation","display_name":"Web navigation","score":0.5378808975219727},{"id":"https://openalex.org/keywords/web-api","display_name":"Web API","score":0.5307174921035767},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5301785469055176},{"id":"https://openalex.org/keywords/web-standards","display_name":"Web standards","score":0.5297008156776428},{"id":"https://openalex.org/keywords/web-development","display_name":"Web development","score":0.5228293538093567},{"id":"https://openalex.org/keywords/web-mapping","display_name":"Web mapping","score":0.502068281173706},{"id":"https://openalex.org/keywords/ws-policy","display_name":"WS-Policy","score":0.4902799427509308},{"id":"https://openalex.org/keywords/information-extraction","display_name":"Information extraction","score":0.4350118041038513},{"id":"https://openalex.org/keywords/web-application-security","display_name":"Web application security","score":0.29845982789993286}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8779193758964539},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.7106871008872986},{"id":"https://openalex.org/C35578498","wikidata":"https://www.wikidata.org/wiki/Q193424","display_name":"Web service","level":2,"score":0.6992048621177673},{"id":"https://openalex.org/C130436687","wikidata":"https://www.wikidata.org/wiki/Q7978591","display_name":"Web modeling","level":3,"score":0.6645928025245667},{"id":"https://openalex.org/C21959979","wikidata":"https://www.wikidata.org/wiki/Q36774","display_name":"Web page","level":2,"score":0.6360929012298584},{"id":"https://openalex.org/C173576120","wikidata":"https://www.wikidata.org/wiki/Q2641220","display_name":"Static web page","level":4,"score":0.6112263202667236},{"id":"https://openalex.org/C196126337","wikidata":"https://www.wikidata.org/wiki/Q821080","display_name":"Mashup","level":4,"score":0.5889759063720703},{"id":"https://openalex.org/C162005631","wikidata":"https://www.wikidata.org/wiki/Q54837","display_name":"Data Web","level":3,"score":0.5796562433242798},{"id":"https://openalex.org/C61096286","wikidata":"https://www.wikidata.org/wiki/Q7978592","display_name":"Web navigation","level":3,"score":0.5378808975219727},{"id":"https://openalex.org/C127613066","wikidata":"https://www.wikidata.org/wiki/Q557770","display_name":"Web API","level":4,"score":0.5307174921035767},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5301785469055176},{"id":"https://openalex.org/C182321512","wikidata":"https://www.wikidata.org/wiki/Q1153289","display_name":"Web standards","level":3,"score":0.5297008156776428},{"id":"https://openalex.org/C79373723","wikidata":"https://www.wikidata.org/wiki/Q386275","display_name":"Web development","level":3,"score":0.5228293538093567},{"id":"https://openalex.org/C24733836","wikidata":"https://www.wikidata.org/wiki/Q649186","display_name":"Web mapping","level":4,"score":0.502068281173706},{"id":"https://openalex.org/C190515685","wikidata":"https://www.wikidata.org/wiki/Q749179","display_name":"WS-Policy","level":5,"score":0.4902799427509308},{"id":"https://openalex.org/C195807954","wikidata":"https://www.wikidata.org/wiki/Q1662562","display_name":"Information extraction","level":2,"score":0.4350118041038513},{"id":"https://openalex.org/C59241245","wikidata":"https://www.wikidata.org/wiki/Q4781497","display_name":"Web application security","level":4,"score":0.29845982789993286}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icws.2004.1314749","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icws.2004.1314749","pdf_url":null,"source":{"id":"https://openalex.org/S4363608934","display_name":"Proceedings. IEEE International Conference on Web Services, 2004.","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings. IEEE International Conference on Web Services, 2004.","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":9,"referenced_works":["https://openalex.org/W1616576116","https://openalex.org/W1962632332","https://openalex.org/W2083330748","https://openalex.org/W2104086170","https://openalex.org/W2135479443","https://openalex.org/W2156049581","https://openalex.org/W6640771989","https://openalex.org/W6675573929","https://openalex.org/W6683209587"],"related_works":["https://openalex.org/W2111074577","https://openalex.org/W2756226611","https://openalex.org/W3114642817","https://openalex.org/W2147899997","https://openalex.org/W2552347367","https://openalex.org/W4231441891","https://openalex.org/W233028058","https://openalex.org/W141137031","https://openalex.org/W1908400262","https://openalex.org/W46003491"],"abstract_inverted_index":{"Extracting":[0],"information":[1,60,89,111,154,176,205,228],"from":[2,23],"the":[3,20,39,47,116,127,156,217,226,230,237,249],"Web":[4,44,53,91,113,120,150,178,207,255],"is":[5,130,192],"a":[6,25,31,43,77,145,197,213],"complex":[7],"task":[8,146],"with":[9],"different":[10,100],"components":[11],"which":[12,55,147,209],"can":[13,62,240],"either":[14],"be":[15,64,84,96,241],"generic":[16],"or":[17],"specific":[18,123],"to":[19,57,83,86,95,98,109,143,168,182,202,211,246],"task,":[21],"going":[22],"downloading":[24],"given":[26,78],"page,":[27],"following":[28],"links,":[29,221],"querying":[30,42,159],"Web-based":[32,214],"applications":[33,236],"via":[34,46],"an":[35,59,175,183,204],"HTML":[36],"form":[37],"and":[38,70,73,122,164,224,244,252],"HTTP":[40,162],"protocol,":[41,49],"service":[45,179,208],"SOAP":[48],"etc.":[50],"Therefore":[51],"building":[52],"services":[54,114,121],"proceed":[56],"executing":[58],"tasks":[61,102],"not":[63],"simply":[65],"hard":[66],"coded":[67],"(i.e.":[68],"written":[69],"compiled":[71],"once":[72],"for":[74],"all":[75,234],"in":[76],"programming":[79],"language).":[80],"In":[81,233],"order":[82],"able":[85,97],"build":[87],"flexible":[88],"extraction":[90,112,177,206],"Services":[92],"we":[93,140],"need":[94],"compose":[99],"sub":[101],"together.":[103],"We":[104],"propose":[105],"a,":[106],"XML-based":[107],"language":[108],"describe":[110,144,203],"as":[115,190],"compositions":[117],"of":[118,219],"existing":[119,184],"functions.":[124],"The":[125],"usefulness":[126],"proposed":[128],"framework":[129],"demonstrated":[131],"by":[132,158],"three":[133,235],"real":[134],"world":[135],"applications.":[136],"(1)":[137],"Search":[138],"engines:":[139],"show":[141],"how":[142,201],"queries":[148],"Google's":[149],"service,":[151],"retrieves":[152],"more":[153],"on":[155,229],"results":[157],"their":[160],"respective":[161],"servers,":[163],"filters":[165],"them":[166],"according":[167],"this":[169],"information.":[170],"(2)":[171],"E-commerce":[172],"sites":[173],":":[174],"giving":[180],"access":[181],"HTML-based":[185],"e-commerce":[186],"online":[187],"application":[188],"such":[189],"Amazon":[191],"built.":[193],"(3)":[194],"Patent":[195],"extraction:":[196],"last":[198],"example":[199],"shows":[200],"allows":[210],"query":[212],"application,":[215],"extract":[216,225],"set":[218],"result":[220,231],"follow":[222],"them,":[223],"needed":[227],"pages.":[232],"generated":[238],"description":[239],"easily":[242],"modified":[243],"completed":[245],"further":[247],"respond":[248],"user's":[250],"needs":[251],"create":[253],"value-added":[254],"services.":[256]},"counts_by_year":[{"year":2015,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
