{"id":"https://openalex.org/W7155410439","doi":"https://doi.org/10.1016/j.array.2026.100841","title":"End-to-end automation of email intelligence in OSINT workflows: Architecture and implementation","display_name":"End-to-end automation of email intelligence in OSINT workflows: Architecture and implementation","publication_year":2026,"publication_date":"2026-04-23","ids":{"openalex":"https://openalex.org/W7155410439","doi":"https://doi.org/10.1016/j.array.2026.100841"},"language":"en","primary_location":{"id":"doi:10.1016/j.array.2026.100841","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.array.2026.100841","pdf_url":null,"source":{"id":"https://openalex.org/S4210194039","display_name":"Array","issn_l":"2590-0056","issn":["2590-0056"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Array","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1016/j.array.2026.100841","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5134377320","display_name":"Bengisu Aydemir","orcid":null},"institutions":[{"id":"https://openalex.org/I3125470973","display_name":"Istanbul Medipol University","ror":"https://ror.org/037jwzz50","country_code":"TR","type":"education","lineage":["https://openalex.org/I3125470973"]}],"countries":["TR"],"is_corresponding":false,"raw_author_name":"Bengisu Aydemir","raw_affiliation_strings":["Department of Computer Engineering, Istanbul Medipol University, Istanbul, Turkiye"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Engineering, Istanbul Medipol University, Istanbul, Turkiye","institution_ids":["https://openalex.org/I3125470973"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001184161","display_name":"Malek Malkawi","orcid":"https://orcid.org/0000-0002-6588-9184"},"institutions":[{"id":"https://openalex.org/I3125470973","display_name":"Istanbul Medipol University","ror":"https://ror.org/037jwzz50","country_code":"TR","type":"education","lineage":["https://openalex.org/I3125470973"]}],"countries":["TR"],"is_corresponding":true,"raw_author_name":"Malek Malkawi","raw_affiliation_strings":["Department of Computer Engineering, Istanbul Medipol University, Istanbul, Turkiye"],"raw_orcid":"https://orcid.org/0000-0002-6588-9184","affiliations":[{"raw_affiliation_string":"Department of Computer Engineering, Istanbul Medipol University, Istanbul, Turkiye","institution_ids":["https://openalex.org/I3125470973"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5134448449","display_name":"Reda Alhajj","orcid":null},"institutions":[{"id":"https://openalex.org/I168635309","display_name":"University of Calgary","ror":"https://ror.org/03yjb2x39","country_code":"CA","type":"education","lineage":["https://openalex.org/I168635309"]},{"id":"https://openalex.org/I177969490","display_name":"University of Southern Denmark","ror":"https://ror.org/03yrrjy16","country_code":"DK","type":"education","lineage":["https://openalex.org/I177969490"]},{"id":"https://openalex.org/I3125470973","display_name":"Istanbul Medipol University","ror":"https://ror.org/037jwzz50","country_code":"TR","type":"education","lineage":["https://openalex.org/I3125470973"]}],"countries":["CA","DK","TR"],"is_corresponding":false,"raw_author_name":"Reda Alhajj","raw_affiliation_strings":["Department of Computer Engineering, Istanbul Medipol University, Istanbul, Turkiye","Department of Computer Science, University of Calgary, Calgary, Canada","Department of Health Informatics, University of Southern Denmark, Odense, Denmark"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Engineering, Istanbul Medipol University, Istanbul, Turkiye","institution_ids":["https://openalex.org/I3125470973"]},{"raw_affiliation_string":"Department of Computer Science, University of Calgary, Calgary, Canada","institution_ids":["https://openalex.org/I168635309"]},{"raw_affiliation_string":"Department of Health Informatics, University of Southern Denmark, Odense, Denmark","institution_ids":["https://openalex.org/I177969490"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5001184161"],"corresponding_institution_ids":["https://openalex.org/I3125470973"],"apc_list":{"value":1350,"currency":"USD","value_usd":1350},"apc_paid":{"value":1350,"currency":"USD","value_usd":1350},"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.69603524,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"30","issue":null,"first_page":"100841","last_page":"100841"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12203","display_name":"Mobile Agent-Based Network Management","score":0.09950000047683716,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12203","display_name":"Mobile Agent-Based Network Management","score":0.09950000047683716,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10772","display_name":"Distributed systems and fault tolerance","score":0.07329999655485153,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.07010000199079514,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/automation","display_name":"Automation","score":0.5557000041007996},{"id":"https://openalex.org/keywords/architecture","display_name":"Architecture","score":0.45809999108314514},{"id":"https://openalex.org/keywords/systems-architecture","display_name":"Systems architecture","score":0.3596999943256378},{"id":"https://openalex.org/keywords/the-internet","display_name":"The Internet","score":0.2851000130176544},{"id":"https://openalex.org/keywords/information-system","display_name":"Information system","score":0.2745000123977661}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5845999717712402},{"id":"https://openalex.org/C115901376","wikidata":"https://www.wikidata.org/wiki/Q184199","display_name":"Automation","level":2,"score":0.5557000041007996},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.45809999108314514},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.3797000050544739},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.37130001187324524},{"id":"https://openalex.org/C98025372","wikidata":"https://www.wikidata.org/wiki/Q477538","display_name":"Systems architecture","level":3,"score":0.3596999943256378},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.2953999936580658},{"id":"https://openalex.org/C110875604","wikidata":"https://www.wikidata.org/wiki/Q75","display_name":"The Internet","level":2,"score":0.2851000130176544},{"id":"https://openalex.org/C180198813","wikidata":"https://www.wikidata.org/wiki/Q121182","display_name":"Information system","level":2,"score":0.2745000123977661},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.2732999920845032},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.2709999978542328},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.2700999975204468},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.25690001249313354}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1016/j.array.2026.100841","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.array.2026.100841","pdf_url":null,"source":{"id":"https://openalex.org/S4210194039","display_name":"Array","issn_l":"2590-0056","issn":["2590-0056"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Array","raw_type":"journal-article"},{"id":"pmh:oai:sdu.dk:openaire/d29c5538-b8cb-43cc-8b66-c1662cf54649","is_oa":true,"landing_page_url":"https://portal.findresearcher.sdu.dk/da/publications/d29c5538-b8cb-43cc-8b66-c1662cf54649","pdf_url":null,"source":{"id":"https://openalex.org/S4306400424","display_name":"University of Southern Denmark Research Portal (University of Southern Denmark)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I177969490","host_organization_name":"University of Southern Denmark","host_organization_lineage":["https://openalex.org/I177969490"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Aydemir, B, Malkawi, M & Alhajj, R 2026, 'End-to-end automation of email intelligence in OSINT workflows : Architecture and implementation', Array, vol. 30, 100841. https://doi.org/10.1016/j.array.2026.100841","raw_type":"info:eu-repo/semantics/publishedVersion"}],"best_oa_location":{"id":"doi:10.1016/j.array.2026.100841","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.array.2026.100841","pdf_url":null,"source":{"id":"https://openalex.org/S4210194039","display_name":"Array","issn_l":"2590-0056","issn":["2590-0056"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Array","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":5,"referenced_works":["https://openalex.org/W2055051465","https://openalex.org/W2207590972","https://openalex.org/W3000208506","https://openalex.org/W4362554543","https://openalex.org/W4384498332"],"related_works":[],"abstract_inverted_index":{"Open":[0],"Source":[1],"Intelligence":[2],"(OSINT)":[3],"has":[4,357,432],"become":[5],"increasingly":[6],"important":[7],"in":[8,30,47,60,390,455],"cybersecurity,":[9,404],"digital":[10,208,410],"risk":[11,411],"assessment,":[12],"and":[13,56,97,108,118,144,169,187,210,217,255,261,272,297,311,332,344,351,363,374,382,409,416,445,457],"investigative":[14,407],"research":[15],"due":[16],"to":[17,58,192,204,399],"the":[18,82,109,123,174,199,202,224,262,308,376,429],"growing":[19],"volume":[20],"of":[21,111,201,220,264,307,370,386,419,428],"publicly":[22],"available":[23],"information.":[24],"Traditional":[25],"OSINT":[26,78,194,392],"tools":[27],"often":[28],"operate":[29],"silos,":[31],"focusing":[32],"on":[33,161,230,329],"narrow":[34],"tasks":[35],"such":[36,268],"as":[37,269],"domain":[38,83,225],"lookup":[39],"or":[40,62,155],"metadata":[41],"extraction,":[42],"which":[43],"limits":[44],"their":[45],"effectiveness":[46,427],"providing":[48],"comprehensive":[49],"intelligence.":[50],"Meanwhile,":[51],"manual":[52,380],"workflows":[53],"remain":[54],"time-consuming":[55],"prone":[57],"errors":[59],"large-scale":[61],"time-sensitive":[63],"scenarios.":[64],"To":[65],"address":[66,142],"these":[67],"challenges,":[68],"this":[69,244],"paper":[70],"presents":[71],"a":[72,127,178,289,298,361],"fully":[73,236],"automated":[74,237],"framework":[75,175,397],"for":[76,103,241,316],"email-focused":[77,242],"explicitly":[79],"scoped":[80],"at":[81,223,375],"level":[84,227],"rather":[85],"than":[86],"individual":[87,140],"mailbox":[88],"verification.":[89],"The":[90,274,319,355,395,426],"system":[91,203,356,431,453],"integrates":[92],"asynchronous":[93],"web":[94,252,352],"scraping,":[95,253],"DNS":[96,254],"WHOIS":[98,256],"queries,":[99,257],"MX":[100,258,313],"record":[101,259,314],"checks":[102],"domain-level":[104,135,317,339,440],"mail":[105],"infrastructure":[106,226],"validation,":[107,260],"analysis":[110,263,372],"email":[112,141,265],"authentication":[113,266],"protocols":[114,267],"including":[115,251,403],"SPF,":[116,270],"DKIM,":[117,271],"DMARC.":[119,273],"Unlike":[120],"conventional":[121],"approaches,":[122],"proposed":[124,240,396,430],"pipeline":[125,238,275],"incorporates":[126],"validation":[128,181,300,323,340,441],"mechanism":[129],"that":[130,173],"combines":[131],"real-time":[132,304,334],"harvesting":[133],"with":[134],"checks,":[136],"avoiding":[137],"assumptions":[138],"about":[139],"existence":[143],"thereby":[145],"improving":[146],"infrastructure-level":[147,180],"reliability":[148],"while":[149,183],"reducing":[150,327],"noise":[151],"from":[152,422],"duplicate,":[153],"role-based,":[154],"inactive":[156],"addresses.":[157],"Experimental":[158],"evaluations":[159,437],"conducted":[160],"17":[162],"domains":[163],"spanning":[164],"academic,":[165],"governmental,":[166],"corporate,":[167],"startup,":[168],"privacy-focused":[170],"providers":[171],"demonstrate":[172],"achieves":[176],"approximately":[177],"90%":[179],"rate,":[182],"maintaining":[184],"consistent":[185],"performance":[186],"competitive":[188],"execution":[189,443],"times":[190],"compared":[191],"existing":[193],"workflows.":[195,393],"These":[196,336],"results":[197],"highlight":[198],"potential":[200],"support":[205],"cybersecurity":[206],"operations,":[207],"forensics,":[209],"threat":[211,405],"intelligence":[212,222,278,421,458],"by":[213,293,413,438],"enabling":[214,333,414],"scalable,":[215],"ethical,":[216],"autonomous":[218],"reconnaissance":[219,249],"email-related":[221,420],"without":[228,280],"relying":[229],"intrusive":[231],"verification":[232,306],"techniques.":[233],"\u2022":[234,285,354,394,425],"A":[235],"is":[239],"OSINT;":[243],"involves":[245],"integrating":[246],"multiple":[247,400],"passive":[248],"techniques,":[250],"enables":[276,367],"end-to-end":[277],"extraction":[279],"requiring":[281],"interactive":[282],"user":[283],"input.":[284],"This":[286,366],"study":[287],"introduces":[288],"harvesting-based":[290],"approach":[291,320],"supported":[292],"context-aware":[294],"HTML":[295],"scraping":[296],"two-stage":[299],"mechanism,":[301],"namely,":[302],"(i)":[303],"data":[305,325,446],"discovered":[309],"addresses,":[310],"(ii)":[312],"lookups":[315],"validation.":[318],"performs":[321],"concurrent":[322],"during":[324],"acquisition,":[326],"reliance":[328],"third-party":[330],"APIs":[331],"processing.":[335],"mechanisms":[337],"improve":[338],"reliability,":[341],"reduce":[342],"noise,":[343],"enable":[345],"effective":[346],"correlation":[347],"between":[348],"metadata,":[349],"infrastructure,":[350],"presence.":[353],"been":[358,433],"implemented":[359],"using":[360],"modular":[362],"extensible":[364],"architecture.":[365],"seamless":[368],"integration":[369],"additional":[371],"modules":[373],"same":[377],"time":[378],"minimizes":[379],"effort":[381],"mitigates":[383],"common":[384],"sources":[385],"human":[387],"error":[388],"inherent":[389],"traditional":[391],"contributes":[398],"application":[401],"domains,":[402],"intelligence,":[406],"journalism,":[408],"monitoring,":[412],"reliable":[415],"scalable":[417],"discovery":[418],"public":[423],"sources.":[424],"demonstrated":[434],"through":[435],"experimental":[436],"measuring":[439],"performance,":[442],"time,":[444],"consistency":[447],"across":[448],"various":[449],"operational":[450],"scenarios,":[451],"indicating":[452],"improvements":[454],"efficiency":[456],"quality.":[459]},"counts_by_year":[],"updated_date":"2026-05-29T09:21:14.243279","created_date":"2026-04-24T00:00:00"}
