{"id":"https://openalex.org/W3031676291","doi":"https://doi.org/10.1109/access.2020.2997907","title":"FLAG-PDFe: Features Oriented Metadata Extraction Framework for Scientific Publications","display_name":"FLAG-PDFe: Features Oriented Metadata Extraction Framework for Scientific Publications","publication_year":2020,"publication_date":"2020-01-01","ids":{"openalex":"https://openalex.org/W3031676291","doi":"https://doi.org/10.1109/access.2020.2997907","mag":"3031676291"},"language":"en","primary_location":{"id":"doi:10.1109/access.2020.2997907","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2020.2997907","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/8948470/09102282.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://ieeexplore.ieee.org/ielx7/6287639/8948470/09102282.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5082558873","display_name":"Muhammad Waqas Ahmed","orcid":"https://orcid.org/0000-0002-4563-8951"},"institutions":[{"id":"https://openalex.org/I4210088086","display_name":"Capital University of Science and Technology","ror":"https://ror.org/004776246","country_code":"PK","type":"education","lineage":["https://openalex.org/I4210088086"]}],"countries":["PK"],"is_corresponding":true,"raw_author_name":"Muhammad Waqas Ahmed","raw_affiliation_strings":["Department of Computer Science, Capital University of Science and Technology, Islamabad, Pakistan"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Capital University of Science and Technology, Islamabad, Pakistan","institution_ids":["https://openalex.org/I4210088086"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5108009280","display_name":"Muhammad Tanvir Afzal","orcid":"https://orcid.org/0000-0002-9765-8815"},"institutions":[{"id":"https://openalex.org/I4210088086","display_name":"Capital University of Science and Technology","ror":"https://ror.org/004776246","country_code":"PK","type":"education","lineage":["https://openalex.org/I4210088086"]}],"countries":["PK"],"is_corresponding":false,"raw_author_name":"Muhammad Tanvir Afzal","raw_affiliation_strings":["Department of Computer Science, Capital University of Science and Technology, Islamabad, Pakistan"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Capital University of Science and Technology, Islamabad, Pakistan","institution_ids":["https://openalex.org/I4210088086"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5082558873"],"corresponding_institution_ids":["https://openalex.org/I4210088086"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":0.8793,"has_fulltext":true,"cited_by_count":14,"citation_normalized_percentile":{"value":0.75857028,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"8","issue":null,"first_page":"99458","last_page":"99469"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9843999743461609,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9811999797821045,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/metadata","display_name":"Metadata","score":0.8467789888381958},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8244684338569641},{"id":"https://openalex.org/keywords/heuristics","display_name":"Heuristics","score":0.7144208550453186},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.612000584602356},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4455413222312927},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.4416278600692749},{"id":"https://openalex.org/keywords/electronic-publishing","display_name":"Electronic publishing","score":0.4192129969596863},{"id":"https://openalex.org/keywords/publishing","display_name":"Publishing","score":0.41457802057266235},{"id":"https://openalex.org/keywords/the-internet","display_name":"The Internet","score":0.2894060015678406}],"concepts":[{"id":"https://openalex.org/C93518851","wikidata":"https://www.wikidata.org/wiki/Q180160","display_name":"Metadata","level":2,"score":0.8467789888381958},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8244684338569641},{"id":"https://openalex.org/C127705205","wikidata":"https://www.wikidata.org/wiki/Q5748245","display_name":"Heuristics","level":2,"score":0.7144208550453186},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.612000584602356},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4455413222312927},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.4416278600692749},{"id":"https://openalex.org/C18599908","wikidata":"https://www.wikidata.org/wiki/Q1196904","display_name":"Electronic publishing","level":3,"score":0.4192129969596863},{"id":"https://openalex.org/C151719136","wikidata":"https://www.wikidata.org/wiki/Q3972943","display_name":"Publishing","level":2,"score":0.41457802057266235},{"id":"https://openalex.org/C110875604","wikidata":"https://www.wikidata.org/wiki/Q75","display_name":"The Internet","level":2,"score":0.2894060015678406},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2020.2997907","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2020.2997907","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/8948470/09102282.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:268fb64774804b74a014664c85078515","is_oa":true,"landing_page_url":"https://doaj.org/article/268fb64774804b74a014664c85078515","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 8, Pp 99458-99469 (2020)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2020.2997907","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2020.2997907","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/8948470/09102282.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/17","score":0.5400000214576721,"display_name":"Partnerships for the goals"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320338370","display_name":"FP7 Information and Communication Technologies","ror":null}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3031676291.pdf","grobid_xml":"https://content.openalex.org/works/W3031676291.grobid-xml"},"referenced_works_count":50,"referenced_works":["https://openalex.org/W791527587","https://openalex.org/W1015675232","https://openalex.org/W1530730108","https://openalex.org/W1559499673","https://openalex.org/W1597517899","https://openalex.org/W1768944425","https://openalex.org/W1907286193","https://openalex.org/W1943383135","https://openalex.org/W1966285711","https://openalex.org/W1976829395","https://openalex.org/W2034222664","https://openalex.org/W2061598441","https://openalex.org/W2079525773","https://openalex.org/W2082470640","https://openalex.org/W2101964309","https://openalex.org/W2110907671","https://openalex.org/W2113064181","https://openalex.org/W2118286367","https://openalex.org/W2121764873","https://openalex.org/W2140190241","https://openalex.org/W2147880316","https://openalex.org/W2166633748","https://openalex.org/W2168065722","https://openalex.org/W2171033594","https://openalex.org/W2171114275","https://openalex.org/W2295508865","https://openalex.org/W2335678039","https://openalex.org/W2513604820","https://openalex.org/W2528997906","https://openalex.org/W2529160902","https://openalex.org/W2529247374","https://openalex.org/W2533973874","https://openalex.org/W2559930789","https://openalex.org/W2612379105","https://openalex.org/W2794075952","https://openalex.org/W2803318469","https://openalex.org/W2918649722","https://openalex.org/W2974012318","https://openalex.org/W2989092762","https://openalex.org/W2990726790","https://openalex.org/W2994947658","https://openalex.org/W3106530750","https://openalex.org/W3159649695","https://openalex.org/W4299456266","https://openalex.org/W4383560187","https://openalex.org/W4400134761","https://openalex.org/W6633305578","https://openalex.org/W6637181481","https://openalex.org/W6638165513","https://openalex.org/W6682082992"],"related_works":["https://openalex.org/W2034429309","https://openalex.org/W4237533532","https://openalex.org/W2418907669","https://openalex.org/W2381066367","https://openalex.org/W4389948559","https://openalex.org/W2963110562","https://openalex.org/W2360824260","https://openalex.org/W2384486841","https://openalex.org/W2381765749","https://openalex.org/W2354149895"],"abstract_inverted_index":{"The":[0,149,261,274],"unprecedented":[1],"growth":[2],"of":[3,35,56,69,101,120,170,188,232,239,258,263,299],"the":[4,12,70,160,163,167,174,177,221,226,255,264,269,296,300],"research":[5,13,29,102,134,171,193],"publications":[6],"in":[7,38,85,137,220],"diversified":[8,125,211],"domains":[9],"has":[10,50,286],"overwhelmed":[11],"community.":[14],"It":[15],"requires":[16],"a":[17,36,39,107,133,144,288],"cumbersome":[18],"process":[19],"to":[20,78,115,182,208,224,253,295],"extract":[21,33,79,116,129,225,254],"this":[22],"enormous":[23],"information":[24,165],"by":[25,58],"manually":[26],"analyzing":[27],"these":[28,210],"documents.":[30,172],"To":[31,128],"automatically":[32],"content":[34,44,57,169],"document":[37],"structured":[40],"way,":[41],"metadata":[42,80,131,257],"and":[43,62,94,155,162,200,242,281],"must":[45],"be":[46,113],"annotated.":[47],"Scientific":[48],"community":[49],"been":[51],"focusing":[52],"on":[53,159,251,291],"automatic":[54],"extraction":[55],"forming":[59],"different":[60,64,184],"heuristics":[61,250],"applying":[63],"machine":[65,243],"learning":[66,244],"techniques.":[67],"One":[68],"renowned":[71],"conference":[72],"organizers,":[73],"ESWC":[74,301],"organizes":[75],"state-of-the-art":[76],"challenge":[77],"like":[81],"authors,":[82],"affiliations,":[83,86],"countries":[84],"supplementary":[87],"material,":[88],"sections,":[89],"table,":[90],"figures,":[91],"funding":[92],"agencies,":[93],"EU":[95],"funded":[96],"projects":[97],"from":[98,122,132,166],"PDF":[99],"files":[100],"articles.":[103],"We":[104,214],"have":[105,142],"proposed":[106],"feature":[108],"centric":[109],"technique":[110],"that":[111],"can":[112],"used":[114,181],"logical":[117,138,227],"layout":[118,139,186,201,228],"structure":[119,229],"articles":[121],"publishers":[123],"with":[124],"composition":[126],"styles.":[127],"unique":[130,197],"article":[135],"placed":[136],"structure,":[140],"we":[141,204,247],"developed":[143],"four-staged":[145],"novel":[146],"approach":[147,150,285,298],"\u201cFLAG-PDFe\u201d.":[148],"is":[151],"built":[152],"upon":[153],"distinct":[154,178],"generic":[156,206,240],"features":[157,179,207,241],"based":[158],"textual":[161],"geometric":[164],"raw":[168],"At":[173],"first":[175],"stage,":[176],"are":[180,266],"identify":[183],"physical":[185],"components":[187],"an":[189,233,259],"individual":[190],"article.":[191,260],"Since":[192],"journals":[194],"follow":[195],"their":[196],"publishing":[198,212],"styles":[199],"formats,":[202],"therefore,":[203],"develop":[205],"handle":[209],"patterns.":[213],"employ":[215],"support":[216],"vector":[217],"classification":[218],"(SVC)":[219],"third":[222],"stage":[223],"(LLS)/":[230],"sections":[231],"article,":[234],"after":[235],"performing":[236],"comprehensive":[237],"evaluation":[238],"models.":[245],"Finally,":[246],"further":[248],"apply":[249],"LLS":[252],"desired":[256],"outcomes":[262],"study":[265],"obtained":[267],"using":[268],"gold":[270],"standard":[271],"data":[272],"set.":[273],"results":[275],"yields":[276],"0.877":[277],"recall,":[278],"precision":[279],"0.928":[280],"0.897":[282],"F-measure.":[283],"Our":[284],"achieved":[287],"16%":[289],"gain":[290],"f-measure":[292],"when":[293],"compared":[294],"best":[297],"challenge.":[302]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":4},{"year":2022,"cited_by_count":3},{"year":2020,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
