{"id":"https://openalex.org/W2753318643","doi":"https://doi.org/10.3115/v1/w14-3401","title":"Natural Language Processing Methods for Enhancing Geographic Metadata for Phylogeography of Zoonotic Viruses","display_name":"Natural Language Processing Methods for Enhancing Geographic Metadata for Phylogeography of Zoonotic Viruses","publication_year":2014,"publication_date":"2014-01-01","ids":{"openalex":"https://openalex.org/W2753318643","doi":"https://doi.org/10.3115/v1/w14-3401","mag":"2753318643"},"language":"en","primary_location":{"id":"doi:10.3115/v1/w14-3401","is_oa":false,"landing_page_url":"https://doi.org/10.3115/v1/w14-3401","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of BioNLP 2014","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5038933482","display_name":"Tasnia Tahsin","orcid":null},"institutions":[{"id":"https://openalex.org/I55732556","display_name":"Arizona State University","ror":"https://ror.org/03efmqc40","country_code":"US","type":"education","lineage":["https://openalex.org/I55732556"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Tasnia Tahsin","raw_affiliation_strings":["Arizona State University**"],"affiliations":[{"raw_affiliation_string":"Arizona State University**","institution_ids":["https://openalex.org/I55732556"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032738234","display_name":"Robert Rivera","orcid":"https://orcid.org/0000-0003-1511-9517"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Robert Rivera","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111972769","display_name":"R. Suzanne Beard","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rachel Beard","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034935918","display_name":"Rob Lauder","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rob Lauder","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040948702","display_name":"Davy Weissenbacher","orcid":"https://orcid.org/0000-0001-8331-3675"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Davy Weissenbacher","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050090926","display_name":"Matthew Scotch","orcid":"https://orcid.org/0000-0001-5100-9724"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Matthew Scotch","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031917808","display_name":"Garrick Wallstrom","orcid":"https://orcid.org/0000-0002-5202-6742"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Garrick Wallstrom","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5022014033","display_name":"Graciela Gonzalez\u2010Hernandez","orcid":"https://orcid.org/0000-0002-6416-9556"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Graciela Gonzalez","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5038933482"],"corresponding_institution_ids":["https://openalex.org/I55732556"],"apc_list":null,"apc_paid":null,"fwci":0.9258,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.80513114,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"9"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12492","display_name":"Zoonotic diseases and public health","score":0.9958000183105469,"subfield":{"id":"https://openalex.org/subfields/2739","display_name":"Public Health, Environmental and Occupational Health"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},"topics":[{"id":"https://openalex.org/T12492","display_name":"Zoonotic diseases and public health","score":0.9958000183105469,"subfield":{"id":"https://openalex.org/subfields/2739","display_name":"Public Health, Environmental and Occupational Health"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T12047","display_name":"Viral Infections and Vectors","score":0.9891999959945679,"subfield":{"id":"https://openalex.org/subfields/2725","display_name":"Infectious Diseases"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T11135","display_name":"Virology and Viral Diseases","score":0.9825999736785889,"subfield":{"id":"https://openalex.org/subfields/2713","display_name":"Epidemiology"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/metadata","display_name":"Metadata","score":0.7956188917160034},{"id":"https://openalex.org/keywords/genbank","display_name":"GenBank","score":0.7130385637283325},{"id":"https://openalex.org/keywords/phylogeography","display_name":"Phylogeography","score":0.6663568615913391},{"id":"https://openalex.org/keywords/geospatial-metadata","display_name":"Geospatial metadata","score":0.6033654808998108},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.569115400314331},{"id":"https://openalex.org/keywords/named-entity-recognition","display_name":"Named-entity recognition","score":0.4290747046470642},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.34193649888038635},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.2985716760158539},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.17856526374816895},{"id":"https://openalex.org/keywords/data-element","display_name":"Data element","score":0.1758396029472351},{"id":"https://openalex.org/keywords/phylogenetics","display_name":"Phylogenetics","score":0.11915183067321777},{"id":"https://openalex.org/keywords/genetics","display_name":"Genetics","score":0.0858510434627533}],"concepts":[{"id":"https://openalex.org/C93518851","wikidata":"https://www.wikidata.org/wiki/Q180160","display_name":"Metadata","level":2,"score":0.7956188917160034},{"id":"https://openalex.org/C79029880","wikidata":"https://www.wikidata.org/wiki/Q901755","display_name":"GenBank","level":3,"score":0.7130385637283325},{"id":"https://openalex.org/C94043034","wikidata":"https://www.wikidata.org/wiki/Q377756","display_name":"Phylogeography","level":4,"score":0.6663568615913391},{"id":"https://openalex.org/C193150823","wikidata":"https://www.wikidata.org/wiki/Q1477538","display_name":"Geospatial metadata","level":5,"score":0.6033654808998108},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.569115400314331},{"id":"https://openalex.org/C2779135771","wikidata":"https://www.wikidata.org/wiki/Q403574","display_name":"Named-entity recognition","level":3,"score":0.4290747046470642},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.34193649888038635},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.2985716760158539},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.17856526374816895},{"id":"https://openalex.org/C30872290","wikidata":"https://www.wikidata.org/wiki/Q1172389","display_name":"Data element","level":3,"score":0.1758396029472351},{"id":"https://openalex.org/C90132467","wikidata":"https://www.wikidata.org/wiki/Q171184","display_name":"Phylogenetics","level":3,"score":0.11915183067321777},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.0858510434627533},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C136976847","wikidata":"https://www.wikidata.org/wiki/Q6822297","display_name":"Meta Data Services","level":4,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.3115/v1/w14-3401","is_oa":false,"landing_page_url":"https://doi.org/10.3115/v1/w14-3401","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of BioNLP 2014","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.7200000286102295,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":15,"referenced_works":["https://openalex.org/W1555476426","https://openalex.org/W1967638266","https://openalex.org/W2022377934","https://openalex.org/W2052086812","https://openalex.org/W2068930226","https://openalex.org/W2088267428","https://openalex.org/W2100627415","https://openalex.org/W2107005506","https://openalex.org/W2128512278","https://openalex.org/W2130362098","https://openalex.org/W2134933826","https://openalex.org/W2156804059","https://openalex.org/W2171772603","https://openalex.org/W2182152229","https://openalex.org/W2251758222"],"related_works":["https://openalex.org/W2373398412","https://openalex.org/W2374379029","https://openalex.org/W2351854916","https://openalex.org/W2359241271","https://openalex.org/W1503116306","https://openalex.org/W4251339169","https://openalex.org/W1980255893","https://openalex.org/W1029779541","https://openalex.org/W1625276278","https://openalex.org/W2018424284"],"abstract_inverted_index":{"Zoonotic":[0],"viruses,":[1],"viruses":[2,35,55,87],"that":[3,15,190,208],"are":[4,62],"transmittable":[5],"between":[6],"animals":[7],"and":[8,50,58],"humans,":[9],"represent":[10],"emerging":[11],"or":[12],"re-emerging":[13],"pathogens":[14],"pose":[16],"significant":[17],"public":[18],"health":[19],"threats":[20],"throughout":[21],"the":[22,48,73,92,107,145,154,182,196],"world.":[23],"It":[24],"is":[25,88],"therefore":[26],"crucial":[27],"to":[28,46,143,194],"advance":[29],"current":[30],"surveillance":[31],"mechanisms":[32],"for":[33,131,147,163],"these":[34,54,86,112],"through":[36],"outlets":[37],"such":[38,69,148],"as":[39,70],"phylogeography.":[40],"Phylogeographic":[41],"techniques":[42],"may":[43,102,179],"be":[44,104,192],"applied":[45],"trace":[47],"origins":[49],"geographical":[51],"distribution":[52],"of":[53,75,85,94,116,156,185],"using":[56,135],"sequence":[57,78],"location":[59,205],"data,":[60],"which":[61,178],"often":[63,103],"obtained":[64],"from":[65,187],"publicly":[66],"available":[67],"databases":[68],"GenBank.":[71],"Despite":[72],"abundance":[74],"zoonotic":[76,166],"viral":[77],"data":[79],"in":[80,106,111,181,211],"GenBank":[81,157,197],"records,":[82,113],"phylogeographic":[83],"analysis":[84],"greatly":[89],"limited":[90],"by":[91],"lack":[93],"adequate":[95],"geographic":[96,161,198],"metadata.":[97,199],"Although":[98],"more":[99],"detailed":[100],"information":[101,118,134,186],"found":[105],"related":[108,188],"articles":[109,189],"referenced":[110],"manual":[114],"extraction":[115,184],"this":[117,124,133,212],"presents":[119],"a":[120,149,202],"severe":[121],"bottleneck.":[122],"In":[123,141],"work,":[125],"we":[126,151,209],"propose":[127],"an":[128],"automated":[129],"system":[130,207],"extracting":[132],"Natural":[136],"Language":[137],"Processing":[138],"(NLP)":[139],"methods.":[140],"order":[142],"validate":[144],"need":[146],"system,":[150],"first":[152],"determine":[153],"percentage":[155],"records":[158],"with":[159],"\u201cinsufficient\u201d":[160],"metadata":[162],"seven":[164],"well-studied":[165],"viruses.":[167],"We":[168],"then":[169],"evaluate":[170],"four":[171],"different":[172],"named":[173],"entity":[174],"recognition":[175],"(NER)":[176],"systems":[177],"help":[180],"automatic":[183],"can":[191],"used":[193],"improve":[195],"This":[200],"includes":[201],"novel":[203],"dictionary-based":[204],"tagging":[206],"introduce":[210],"paper.":[213]},"counts_by_year":[{"year":2018,"cited_by_count":2},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
