{"id":"https://openalex.org/W4407937106","doi":"https://doi.org/10.1109/tdsc.2025.3545771","title":"BERT-PhishFinder: A Robust Model for Accurate Phishing URL Detection With Optimized DistilBERT","display_name":"BERT-PhishFinder: A Robust Model for Accurate Phishing URL Detection With Optimized DistilBERT","publication_year":2025,"publication_date":"2025-02-25","ids":{"openalex":"https://openalex.org/W4407937106","doi":"https://doi.org/10.1109/tdsc.2025.3545771"},"language":"en","primary_location":{"id":"doi:10.1109/tdsc.2025.3545771","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tdsc.2025.3545771","pdf_url":null,"source":{"id":"https://openalex.org/S133795288","display_name":"IEEE Transactions on Dependable and Secure Computing","issn_l":"1545-5971","issn":["1545-5971","1941-0018","2160-9209"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Dependable and Secure Computing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5088958040","display_name":"Ali Aljofey","orcid":"https://orcid.org/0000-0002-1494-5107"},"institutions":[{"id":"https://openalex.org/I180726961","display_name":"Shenzhen University","ror":"https://ror.org/01vy4gh70","country_code":"CN","type":"education","lineage":["https://openalex.org/I180726961"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Ali Aljofey","raw_affiliation_strings":["Shenzhen Key Laboratory of Advanced Machine Learning and Applications, College of Mathematics and Statistics, Shenzhen University, Shenzhen, China"],"raw_orcid":"https://orcid.org/0000-0002-1494-5107","affiliations":[{"raw_affiliation_string":"Shenzhen Key Laboratory of Advanced Machine Learning and Applications, College of Mathematics and Statistics, Shenzhen University, Shenzhen, China","institution_ids":["https://openalex.org/I180726961"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008579903","display_name":"Saifullahi Aminu Bello","orcid":null},"institutions":[{"id":"https://openalex.org/I180726961","display_name":"Shenzhen University","ror":"https://ror.org/01vy4gh70","country_code":"CN","type":"education","lineage":["https://openalex.org/I180726961"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Saifullahi Aminu Bello","raw_affiliation_strings":["Shenzhen Key Laboratory of Advanced Machine Learning and Applications, College of Mathematics and Statistics, Shenzhen University, Shenzhen, China"],"raw_orcid":"https://orcid.org/0000-0001-5328-6469","affiliations":[{"raw_affiliation_string":"Shenzhen Key Laboratory of Advanced Machine Learning and Applications, College of Mathematics and Statistics, Shenzhen University, Shenzhen, China","institution_ids":["https://openalex.org/I180726961"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066196985","display_name":"Jian L\u00fc","orcid":"https://orcid.org/0000-0003-4599-7281"},"institutions":[{"id":"https://openalex.org/I180726961","display_name":"Shenzhen University","ror":"https://ror.org/01vy4gh70","country_code":"CN","type":"education","lineage":["https://openalex.org/I180726961"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jian Lu","raw_affiliation_strings":["Shenzhen Key Laboratory of Advanced Machine Learning and Applications, College of Mathematics and Statistics, Shenzhen University, Shenzhen, China"],"raw_orcid":"https://orcid.org/0000-0003-4599-7281","affiliations":[{"raw_affiliation_string":"Shenzhen Key Laboratory of Advanced Machine Learning and Applications, College of Mathematics and Statistics, Shenzhen University, Shenzhen, China","institution_ids":["https://openalex.org/I180726961"]}]},{"author_position":"last","author":{"id":null,"display_name":"Chen Xu","orcid":"https://orcid.org/0000-0002-1271-0734"},"institutions":[{"id":"https://openalex.org/I180726961","display_name":"Shenzhen University","ror":"https://ror.org/01vy4gh70","country_code":"CN","type":"education","lineage":["https://openalex.org/I180726961"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chen Xu","raw_affiliation_strings":["Shenzhen Key Laboratory of Advanced Machine Learning and Applications, College of Mathematics and Statistics, Shenzhen University, Shenzhen, China"],"raw_orcid":"https://orcid.org/0000-0002-1271-0734","affiliations":[{"raw_affiliation_string":"Shenzhen Key Laboratory of Advanced Machine Learning and Applications, College of Mathematics and Statistics, Shenzhen University, Shenzhen, China","institution_ids":["https://openalex.org/I180726961"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5088958040"],"corresponding_institution_ids":["https://openalex.org/I180726961"],"apc_list":null,"apc_paid":null,"fwci":34.7257,"has_fulltext":false,"cited_by_count":14,"citation_normalized_percentile":{"value":0.9965501,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":100},"biblio":{"volume":"22","issue":"4","first_page":"4315","last_page":"4329"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11644","display_name":"Spam and Phishing Detection","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11644","display_name":"Spam and Phishing Detection","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11147","display_name":"Misinformation and Its Impacts","score":0.9916999936103821,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.984000027179718,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7901203632354736},{"id":"https://openalex.org/keywords/phishing","display_name":"Phishing","score":0.6939841508865356},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.4423828721046448},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.37708181142807007},{"id":"https://openalex.org/keywords/the-internet","display_name":"The Internet","score":0.258492112159729},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.21594402194023132}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7901203632354736},{"id":"https://openalex.org/C83860907","wikidata":"https://www.wikidata.org/wiki/Q135005","display_name":"Phishing","level":3,"score":0.6939841508865356},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.4423828721046448},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.37708181142807007},{"id":"https://openalex.org/C110875604","wikidata":"https://www.wikidata.org/wiki/Q75","display_name":"The Internet","level":2,"score":0.258492112159729},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.21594402194023132},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tdsc.2025.3545771","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tdsc.2025.3545771","pdf_url":null,"source":{"id":"https://openalex.org/S133795288","display_name":"IEEE Transactions on Dependable and Secure Computing","issn_l":"1545-5971","issn":["1545-5971","1941-0018","2160-9209"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Dependable and Secure Computing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3105280189","display_name":null,"funder_award_id":"U21A20455","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6262497296","display_name":null,"funder_award_id":"12326619","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7972534515","display_name":null,"funder_award_id":"62372302","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":40,"referenced_works":["https://openalex.org/W1832693441","https://openalex.org/W2088227176","https://openalex.org/W2190286163","https://openalex.org/W2297844173","https://openalex.org/W2528865691","https://openalex.org/W2625935159","https://openalex.org/W2782609208","https://openalex.org/W2890718808","https://openalex.org/W2909737018","https://openalex.org/W2919115771","https://openalex.org/W2944669302","https://openalex.org/W2964635261","https://openalex.org/W2982692510","https://openalex.org/W2999357838","https://openalex.org/W3007485446","https://openalex.org/W3023514002","https://openalex.org/W3085804088","https://openalex.org/W3114349121","https://openalex.org/W3123603445","https://openalex.org/W3158143049","https://openalex.org/W3162677480","https://openalex.org/W3191442433","https://openalex.org/W4200587960","https://openalex.org/W4221129096","https://openalex.org/W4225454120","https://openalex.org/W4298008244","https://openalex.org/W4306953359","https://openalex.org/W4322487983","https://openalex.org/W4385245566","https://openalex.org/W4387668052","https://openalex.org/W6628877408","https://openalex.org/W6732691979","https://openalex.org/W6748384357","https://openalex.org/W6749825310","https://openalex.org/W6755207826","https://openalex.org/W6766673545","https://openalex.org/W6768021236","https://openalex.org/W6768851824","https://openalex.org/W6784333009","https://openalex.org/W6858039225"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2149202530","https://openalex.org/W2807822918","https://openalex.org/W2921723332","https://openalex.org/W4391093354","https://openalex.org/W2482950156","https://openalex.org/W4396966040","https://openalex.org/W2305322260"],"abstract_inverted_index":{"Phishing":[0],"URL":[1,72,154,160,194],"detection":[2,161,195],"has":[3],"become":[4],"a":[5,30,60,116],"critical":[6],"challenge":[7],"in":[8,86,157],"cybersecurity,":[9],"with":[10,91,138,200],"existing":[11,177],"methods":[12,178],"often":[13],"struggling":[14],"to":[15,37,66,100,114],"maintain":[16],"high":[17],"accuracy":[18],"while":[19],"generalizing":[20],"across":[21],"diverse":[22,147],"datasets.":[23],"In":[24],"this":[25,39,121,199],"article,":[26],"we":[27,82],"introduce":[28],"BERT-PhishFinder,":[29],"novel":[31],"and":[32,79,95,104,141,149,175],"efficient":[33],"transformer-based":[34],"model":[35,126],"designed":[36],"tackle":[38],"problem.":[40],"While":[41],"most":[42],"traditional":[43],"approaches":[44],"rely":[45],"heavily":[46],"on":[47,179],"lexical":[48],"features":[49,150],"or":[50],"complex":[51],"convolutional":[52],"architectures,":[53],"BERT-PhishFinder":[54,185],"leverages":[55],"the":[56,76,87,152,189],"power":[57],"of":[58,71],"DistilBERT,":[59],"lightweight":[61],"yet":[62],"highly":[63],"effective":[64],"transformer,":[65],"capture":[67],"rich":[68],"contextual":[69],"representations":[70,110],"sequences.":[73],"To":[74],"enhance":[75],"model\u2019s":[77],"robustness":[78],"reduce":[80],"overfitting,":[81],"strategically":[83],"incorporate":[84],"SpatialDropout1D":[85],"embedding":[88],"layers,":[89,136],"along":[90],"global":[92,96],"average":[93],"pooling":[94,98],"max":[97],"techniques":[99],"extract":[101],"both":[102],"comprehensive":[103,117],"key":[105],"discriminative":[106],"features.":[107],"The":[108],"pooled":[109],"are":[111],"thoughtfully":[112],"concatenated":[113],"form":[115],"feature":[118],"representation.":[119],"Through":[120],"carefully":[122],"crafted":[123],"design,":[124],"our":[125],"adopts":[127],"ensemble":[128],"learning,":[129],"as":[130],"it":[131],"undergoes":[132],"multiple":[133],"parallel":[134],"dense":[135],"each":[137],"distinct":[139],"parameters":[140],"dropout":[142],"regularization.":[143],"This":[144],"facilitates":[145],"learning":[146,168],"patterns":[148],"from":[151],"input":[153],"sequence,":[155],"culminating":[156],"exceptional":[158],"phishing":[159,193],"performance.":[162],"Extensive":[163],"evaluations":[164],"against":[165],"conventional":[166],"deep":[167],"algorithms,":[169],"transformer":[170],"models":[171],"(XLNet,":[172],"RoBERTa,":[173],"ALBERT),":[174],"other":[176],"five":[180],"benchmark":[181],"datasets":[182],"show":[183],"that":[184],"not":[186],"only":[187],"achieves":[188],"state":[190],"of-the-art":[191],"real":[192],"but":[196],"also":[197],"accomplishes":[198],"reduced":[201],"label":[202],"dependency.":[203]},"counts_by_year":[{"year":2026,"cited_by_count":8},{"year":2025,"cited_by_count":6}],"updated_date":"2026-05-31T08:46:17.908082","created_date":"2025-10-10T00:00:00"}
