{"id":"https://openalex.org/W3005049267","doi":"https://doi.org/10.1109/access.2020.3020868","title":"Generating Biomedical Question Answering Corpora From Q&amp;A Forums","display_name":"Generating Biomedical Question Answering Corpora From Q&amp;A Forums","publication_year":2020,"publication_date":"2020-01-01","ids":{"openalex":"https://openalex.org/W3005049267","doi":"https://doi.org/10.1109/access.2020.3020868","mag":"3005049267"},"language":"en","primary_location":{"id":"doi:10.1109/access.2020.3020868","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2020.3020868","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/8948470/09184044.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://ieeexplore.ieee.org/ielx7/6287639/8948470/09184044.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Andre Lamurias","orcid":"https://orcid.org/0000-0001-7965-6536"},"institutions":[{"id":"https://openalex.org/I141596103","display_name":"University of Lisbon","ror":"https://ror.org/01c27hj86","country_code":"PT","type":"education","lineage":["https://openalex.org/I141596103"]}],"countries":["PT"],"is_corresponding":true,"raw_author_name":"Andre Lamurias","raw_affiliation_strings":["LASIGE, Faculdade de Ci\u00eancias, Universidade de Lisboa, Lisbon, Portugal"],"affiliations":[{"raw_affiliation_string":"LASIGE, Faculdade de Ci\u00eancias, Universidade de Lisboa, Lisbon, Portugal","institution_ids":["https://openalex.org/I141596103"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Diana Sousa","orcid":"https://orcid.org/0000-0003-0597-9273"},"institutions":[{"id":"https://openalex.org/I141596103","display_name":"University of Lisbon","ror":"https://ror.org/01c27hj86","country_code":"PT","type":"education","lineage":["https://openalex.org/I141596103"]}],"countries":["PT"],"is_corresponding":false,"raw_author_name":"Diana Sousa","raw_affiliation_strings":["LASIGE, Faculdade de Ci\u00eancias, Universidade de Lisboa, Lisbon, Portugal"],"affiliations":[{"raw_affiliation_string":"LASIGE, Faculdade de Ci\u00eancias, Universidade de Lisboa, Lisbon, Portugal","institution_ids":["https://openalex.org/I141596103"]}]},{"author_position":"last","author":{"id":null,"display_name":"Francisco M. Couto","orcid":"https://orcid.org/0000-0003-0627-1496"},"institutions":[{"id":"https://openalex.org/I141596103","display_name":"University of Lisbon","ror":"https://ror.org/01c27hj86","country_code":"PT","type":"education","lineage":["https://openalex.org/I141596103"]}],"countries":["PT"],"is_corresponding":false,"raw_author_name":"Francisco M. Couto","raw_affiliation_strings":["LASIGE, Faculdade de Ci\u00eancias, Universidade de Lisboa, Lisbon, Portugal"],"affiliations":[{"raw_affiliation_string":"LASIGE, Faculdade de Ci\u00eancias, Universidade de Lisboa, Lisbon, Portugal","institution_ids":["https://openalex.org/I141596103"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I141596103"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":0.5438,"has_fulltext":true,"cited_by_count":14,"citation_normalized_percentile":{"value":0.72486795,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":"8","issue":null,"first_page":"161042","last_page":"161051"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.3456000089645386,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.3456000089645386,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13274","display_name":"Expert finding and Q&A systems","score":0.22310000658035278,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.13819999992847443,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/question-answering","display_name":"Question answering","score":0.8513000011444092},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6728000044822693},{"id":"https://openalex.org/keywords/baseline","display_name":"Baseline (sea)","score":0.6096000075340271},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.5133000016212463},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.43459999561309814},{"id":"https://openalex.org/keywords/questions-and-answers","display_name":"Questions and answers","score":0.38989999890327454},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.367900013923645},{"id":"https://openalex.org/keywords/task-analysis","display_name":"Task analysis","score":0.3517000079154968}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8632000088691711},{"id":"https://openalex.org/C44291984","wikidata":"https://www.wikidata.org/wiki/Q1074173","display_name":"Question answering","level":2,"score":0.8513000011444092},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6728000044822693},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.6154000163078308},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.6096000075340271},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.592199981212616},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5339000225067139},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.5133000016212463},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.43459999561309814},{"id":"https://openalex.org/C3019144022","wikidata":"https://www.wikidata.org/wiki/Q4124998","display_name":"Questions and answers","level":2,"score":0.38989999890327454},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.367900013923645},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.3603000044822693},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.3517000079154968},{"id":"https://openalex.org/C148524875","wikidata":"https://www.wikidata.org/wiki/Q6975395","display_name":"F1 score","level":2,"score":0.3402999937534332},{"id":"https://openalex.org/C161156560","wikidata":"https://www.wikidata.org/wiki/Q1638872","display_name":"Document retrieval","level":2,"score":0.322299987077713},{"id":"https://openalex.org/C2779135771","wikidata":"https://www.wikidata.org/wiki/Q403574","display_name":"Named-entity recognition","level":3,"score":0.32170000672340393},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.31459999084472656},{"id":"https://openalex.org/C2776608160","wikidata":"https://www.wikidata.org/wiki/Q4785462","display_name":"Natural (archaeology)","level":2,"score":0.29420000314712524},{"id":"https://openalex.org/C2776145971","wikidata":"https://www.wikidata.org/wiki/Q30673951","display_name":"Labeled data","level":2,"score":0.2930999994277954},{"id":"https://openalex.org/C2993776861","wikidata":"https://www.wikidata.org/wiki/Q1074173","display_name":"Open domain","level":3,"score":0.2906999886035919},{"id":"https://openalex.org/C2474386","wikidata":"https://www.wikidata.org/wiki/Q461183","display_name":"Text corpus","level":2,"score":0.27559998631477356},{"id":"https://openalex.org/C207685749","wikidata":"https://www.wikidata.org/wiki/Q2088941","display_name":"Domain knowledge","level":2,"score":0.26440000534057617},{"id":"https://openalex.org/C59656382","wikidata":"https://www.wikidata.org/wiki/Q191536","display_name":"Conjunction (astronomy)","level":2,"score":0.2572000026702881},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.25270000100135803},{"id":"https://openalex.org/C2780656832","wikidata":"https://www.wikidata.org/wiki/Q796573","display_name":"Online discussion","level":2,"score":0.2524000108242035}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/access.2020.3020868","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2020.3020868","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/8948470/09184044.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:2002.02375","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2002.02375","pdf_url":"https://arxiv.org/pdf/2002.02375","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"pmh:oai:doaj.org/article:6c856978a1b648009336d94cc1c016e8","is_oa":true,"landing_page_url":"https://doaj.org/article/6c856978a1b648009336d94cc1c016e8","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 8, Pp 161042-161051 (2020)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2020.3020868","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2020.3020868","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/8948470/09184044.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1759428316","display_name":null,"funder_award_id":"UIDP/00408/2020","funder_id":"https://openalex.org/F4320334779","funder_display_name":"Funda\u00e7\u00e3o para a Ci\u00eancia e a Tecnologia"},{"id":"https://openalex.org/G2089664753","display_name":null,"funder_award_id":"UIDB/00408/2020","funder_id":"https://openalex.org/F4320334779","funder_display_name":"Funda\u00e7\u00e3o para a Ci\u00eancia e a Tecnologia"},{"id":"https://openalex.org/G2987173697","display_name":null,"funder_award_id":"UIDP/","funder_id":"https://openalex.org/F4320334779","funder_display_name":"Funda\u00e7\u00e3o para a Ci\u00eancia e a Tecnologia"},{"id":"https://openalex.org/G3272457656","display_name":null,"funder_award_id":"UIDB/","funder_id":"https://openalex.org/F4320334779","funder_display_name":"Funda\u00e7\u00e3o para a Ci\u00eancia e a Tecnologia"},{"id":"https://openalex.org/G3284537356","display_name":null,"funder_award_id":"SFRH/B","funder_id":"https://openalex.org/F4320334779","funder_display_name":"Funda\u00e7\u00e3o para a Ci\u00eancia e a Tecnologia"},{"id":"https://openalex.org/G4384961418","display_name":null,"funder_award_id":"PTDC/CCI-BIO/28685/2017","funder_id":"https://openalex.org/F4320334779","funder_display_name":"Funda\u00e7\u00e3o para a Ci\u00eancia e a Tecnologia"},{"id":"https://openalex.org/G5454278309","display_name":null,"funder_award_id":"/2017","funder_id":"https://openalex.org/F4320334779","funder_display_name":"Funda\u00e7\u00e3o para a Ci\u00eancia e a Tecnologia"},{"id":"https://openalex.org/G5818630289","display_name":null,"funder_award_id":"SFRH/BD/","funder_id":"https://openalex.org/F4320334779","funder_display_name":"Funda\u00e7\u00e3o para a Ci\u00eancia e a Tecnologia"},{"id":"https://openalex.org/G6299983296","display_name":null,"funder_award_id":"PTDC/","funder_id":"https://openalex.org/F4320334779","funder_display_name":"Funda\u00e7\u00e3o para a Ci\u00eancia e a Tecnologia"},{"id":"https://openalex.org/G724804869","display_name":null,"funder_award_id":"SFRH/","funder_id":"https://openalex.org/F4320334779","funder_display_name":"Funda\u00e7\u00e3o para a Ci\u00eancia e a Tecnologia"},{"id":"https://openalex.org/G8608336858","display_name":null,"funder_award_id":"SFRH/BD/145221/2019","funder_id":"https://openalex.org/F4320334779","funder_display_name":"Funda\u00e7\u00e3o para a Ci\u00eancia e a Tecnologia"}],"funders":[{"id":"https://openalex.org/F4320334779","display_name":"Funda\u00e7\u00e3o para a Ci\u00eancia e a Tecnologia","ror":"https://ror.org/00snfqn58"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3005049267.pdf","grobid_xml":"https://content.openalex.org/works/W3005049267.grobid-xml"},"referenced_works_count":24,"referenced_works":["https://openalex.org/W1975143876","https://openalex.org/W1981208470","https://openalex.org/W2057415299","https://openalex.org/W2192410469","https://openalex.org/W2250539671","https://openalex.org/W2252143362","https://openalex.org/W2536015822","https://openalex.org/W2740815822","https://openalex.org/W2766284073","https://openalex.org/W2889414415","https://openalex.org/W2891113091","https://openalex.org/W2906722631","https://openalex.org/W2910490538","https://openalex.org/W2912924812","https://openalex.org/W2962977107","https://openalex.org/W2964012472","https://openalex.org/W2965826089","https://openalex.org/W2970482702","https://openalex.org/W2970986790","https://openalex.org/W3003693574","https://openalex.org/W3149154678","https://openalex.org/W6732201471","https://openalex.org/W6753061502","https://openalex.org/W6758691756"],"related_works":["https://openalex.org/W128392744","https://openalex.org/W1550833313","https://openalex.org/W105002793","https://openalex.org/W2119364316","https://openalex.org/W2915016798","https://openalex.org/W1561629270","https://openalex.org/W1749760625","https://openalex.org/W1594355641","https://openalex.org/W1581726712","https://openalex.org/W1595388086"],"abstract_inverted_index":{"Question":[0],"Answering":[1],"(QA)":[2],"is":[3],"a":[4,31,52,70,179,190],"natural":[5],"language":[6],"processing":[7],"task":[8],"that":[9,90,165,184,220],"aims":[10],"at":[11,238],"obtaining":[12,128],"relevant":[13],"answers":[14,89,170,223],"to":[15,33,38,54,125,174,188,202,233],"user":[16],"questions.":[17],"While":[18],"some":[19],"progress":[20],"has":[21],"been":[22],"made":[23],"in":[24],"this":[25],"area,":[26],"biomedical":[27],"questions":[28,85,130,176],"are":[29,171,214,236],"still":[30],"challenge":[32],"most":[34,74],"QA":[35,75,95],"approaches,":[36],"due":[37],"the":[39,42,84,87,107,118,138,147,155,166,175,204,208,230],"complexity":[40],"of":[41,47,73,113,140,149,157],"domain":[43],"and":[44,86,104,131,146,177,216,229],"limited":[45],"availability":[46],"training":[48],"sets.":[49],"We":[50,116,135],"present":[51],"method":[53],"automatically":[55],"extract":[56],"question-article":[57,108,133],"pairs":[58,109],"from":[59,81,207,217],"Q&A":[60],"web":[61],"forums,":[62,127],"which":[63],"can":[64,101,199],"be":[65,102,200],"used":[66,201,232],"for":[67],"document":[68,99,159],"retrieval,":[69],"crucial":[71],"step":[72],"systems.":[76],"The":[77,196,226],"proposed":[78,197],"framework":[79,124,198,231],"extracts":[80],"selected":[82],"forums":[83,210,219],"respective":[88],"contain":[91],"citations.":[92],"This":[93],"way,":[94],"systems":[96],"based":[97],"on":[98,151],"retrieval":[100,160],"developed":[103],"evaluated":[105,136],"using":[106,189],"annotated":[110,193],"by":[111,121,194],"users":[112],"these":[114],"forums.":[115],"generated":[117],"BiQA":[119,205,227],"corpus":[120,206,228],"applying":[122],"our":[123],"three":[126],"7,453":[129],"14,239":[132],"pairs.":[134],"how":[137],"number":[139,148],"articles":[141,167],"associated":[142],"with":[143,224],"each":[144,152],"question":[145],"votes":[150],"answer":[153],"affects":[154],"performance":[156,187],"baseline":[158],"approaches.":[161],"Also,":[162],"we":[163],"demonstrated":[164],"given":[168],"as":[169,211],"significantly":[172],"similar":[173,186],"trained":[178],"state-of-the-art":[180],"deep":[181],"learning":[182],"model":[183],"obtained":[185],"dataset":[191],"manually":[192],"experts.":[195],"update":[203],"same":[209],"new":[212],"posts":[213],"made,":[215],"other":[218],"support":[221],"their":[222],"documents.":[225],"generate":[234],"it":[235],"available":[237],"https://github.com/lasigeBioTM/BiQA.":[239]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":6},{"year":2024,"cited_by_count":2},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":1}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2020-02-14T00:00:00"}
