{"id":"https://openalex.org/W7131435902","doi":"https://doi.org/10.48550/arxiv.2602.18961","title":"Depth-Enhanced YOLO-SAM2 Detection for Reliable Ballast Insufficiency Identification","display_name":"Depth-Enhanced YOLO-SAM2 Detection for Reliable Ballast Insufficiency Identification","publication_year":2026,"publication_date":"2026-02-21","ids":{"openalex":"https://openalex.org/W7131435902","doi":"https://doi.org/10.48550/arxiv.2602.18961"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2602.18961","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.18961","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2602.18961","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5126803325","display_name":"Shiyu Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Liu, Shiyu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054697994","display_name":"D.G. Lester","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lester, Dylan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005801366","display_name":"Husnu S. Narman","orcid":"https://orcid.org/0000-0003-0788-6265"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Narman, Husnu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080165136","display_name":"Ammar Alzarrad","orcid":"https://orcid.org/0000-0002-6012-5679"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Alzarrad, Ammar","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5126714353","display_name":"Pingping Zhu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhu, Pingping","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5126803325"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10842","display_name":"Railway Engineering and Dynamics","score":0.6773999929428101,"subfield":{"id":"https://openalex.org/subfields/2210","display_name":"Mechanical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10842","display_name":"Railway Engineering and Dynamics","score":0.6773999929428101,"subfield":{"id":"https://openalex.org/subfields/2210","display_name":"Mechanical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11606","display_name":"Infrastructure Maintenance and Monitoring","score":0.22849999368190765,"subfield":{"id":"https://openalex.org/subfields/2205","display_name":"Civil and Structural Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.019099999219179153,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/ballast","display_name":"Ballast","score":0.727400004863739},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.6157000064849854},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.5759999752044678},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.5275999903678894},{"id":"https://openalex.org/keywords/distortion","display_name":"Distortion (music)","score":0.42579999566078186},{"id":"https://openalex.org/keywords/sampling","display_name":"Sampling (signal processing)","score":0.3817000091075897},{"id":"https://openalex.org/keywords/polynomial","display_name":"Polynomial","score":0.362199991941452}],"concepts":[{"id":"https://openalex.org/C125907379","wikidata":"https://www.wikidata.org/wiki/Q4851537","display_name":"Ballast","level":2,"score":0.727400004863739},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.6157000064849854},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.5759999752044678},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5472000241279602},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5321999788284302},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5302000045776367},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.5275999903678894},{"id":"https://openalex.org/C126780896","wikidata":"https://www.wikidata.org/wiki/Q899871","display_name":"Distortion (music)","level":4,"score":0.42579999566078186},{"id":"https://openalex.org/C140779682","wikidata":"https://www.wikidata.org/wiki/Q210868","display_name":"Sampling (signal processing)","level":3,"score":0.3817000091075897},{"id":"https://openalex.org/C90119067","wikidata":"https://www.wikidata.org/wiki/Q43260","display_name":"Polynomial","level":2,"score":0.362199991941452},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.3521000146865845},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.35030001401901245},{"id":"https://openalex.org/C81669768","wikidata":"https://www.wikidata.org/wiki/Q2359161","display_name":"Precision and recall","level":2,"score":0.3492000102996826},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3488999903202057},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.335099995136261},{"id":"https://openalex.org/C4725764","wikidata":"https://www.wikidata.org/wiki/Q844704","display_name":"Extraction (chemistry)","level":2,"score":0.2802000045776367},{"id":"https://openalex.org/C7305733","wikidata":"https://www.wikidata.org/wiki/Q207961","display_name":"Geometric shape","level":2,"score":0.2736000120639801},{"id":"https://openalex.org/C115901376","wikidata":"https://www.wikidata.org/wiki/Q184199","display_name":"Automation","level":2,"score":0.25220000743865967}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2602.18961","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.18961","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2602.18961","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.18961","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"This":[0],"paper":[1],"presents":[2],"a":[3,59,147],"depth-enhanced":[4,101],"YOLO-SAM2":[5,145],"framework":[6],"for":[7,65,90,153],"detecting":[8],"ballast":[9,88,156],"insufficiency":[10],"in":[11,159],"railway":[12,155],"tracks":[13],"using":[14,69],"RGB-D":[15,97],"data.":[16],"Although":[17],"YOLOv8":[18],"provides":[19],"reliable":[20,151],"localization,":[21],"the":[22,46,105],"RGB-only":[23],"model":[24],"shows":[25],"limited":[26],"safety":[27],"performance,":[28],"achieving":[29],"high":[30,126],"precision":[31],"(0.99)":[32],"but":[33],"low":[34],"recall":[35,120],"(0.49)":[36],"due":[37],"to":[38,44,124,134],"insufficient":[39,108],"ballast,":[40],"as":[41,125,127],"it":[42],"tends":[43],"over-predict":[45],"sufficient":[47],"class.":[48],"To":[49],"improve":[50,104],"reliability,":[51],"we":[52],"incorporate":[53],"depth-based":[54],"geometric":[55,91,118],"analysis":[56],"enabled":[57],"by":[58],"sleeper-aligned":[60],"depth-correction":[61],"pipeline":[62],"that":[63,100,140],"compensates":[64],"RealSense":[66],"spatial":[67],"distortion":[68],"polynomial":[70],"modeling,":[71],"RANSAC,":[72],"and":[73,87,117,129,150],"temporal":[74],"smoothing.":[75],"SAM2":[76],"segmentation":[77],"further":[78],"refines":[79],"region-of-interest":[80],"masks,":[81],"enabling":[82],"accurate":[83],"extraction":[84],"of":[85,107],"sleeper":[86],"profiles":[89],"classification.":[92],"Experiments":[93],"on":[94,111],"field-collected":[95],"top-down":[96],"data":[98],"show":[99],"configurations":[102],"substantially":[103],"detection":[106],"ballast.":[109],"Depending":[110],"bounding-box":[112],"sampling":[113],"(AABB":[114],"or":[115,162],"RBB)":[116],"criteria,":[119],"increases":[121],"from":[122,132],"0.49":[123],"0.80,":[128],"F1-score":[130],"improves":[131],"0.66":[133],"over":[135],"0.80.":[136],"These":[137],"results":[138],"demonstrate":[139],"integrating":[141],"depth":[142],"correction":[143],"with":[144],"yields":[146],"more":[148],"robust":[149],"approach":[152],"automated":[154],"inspection,":[157],"particularly":[158],"visually":[160],"ambiguous":[161],"safety-critical":[163],"scenarios.":[164]},"counts_by_year":[],"updated_date":"2026-05-04T08:30:34.212998","created_date":"2026-02-26T00:00:00"}
