{"id":"https://openalex.org/W4414688137","doi":"https://doi.org/10.1109/iccv51701.2025.00463","title":"RIPE: Reinforcement Learning on Unlabeled Image Pairs for Robust Keypoint Extraction","display_name":"RIPE: Reinforcement Learning on Unlabeled Image Pairs for Robust Keypoint Extraction","publication_year":2025,"publication_date":"2025-10-19","ids":{"openalex":"https://openalex.org/W4414688137","doi":"https://doi.org/10.1109/iccv51701.2025.00463"},"language":"en","primary_location":{"id":"doi:10.1109/iccv51701.2025.00463","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccv51701.2025.00463","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/CVF International Conference on Computer Vision (ICCV)","raw_type":"proceedings-article"},"type":"article","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2507.04839","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5075158019","display_name":"Johannes K\u00fcnzel","orcid":"https://orcid.org/0000-0002-3561-2758"},"institutions":[{"id":"https://openalex.org/I2800274787","display_name":"Fraunhofer Institute for Telecommunications, Heinrich Hertz Institute","ror":"https://ror.org/02tbr6331","country_code":"DE","type":"facility","lineage":["https://openalex.org/I2800274787","https://openalex.org/I4923324"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Johannes K\u00fcnzel","raw_affiliation_strings":["Fraunhofer Heinrich-Hertz-Institut, HHI,Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Fraunhofer Heinrich-Hertz-Institut, HHI,Germany","institution_ids":["https://openalex.org/I2800274787"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074580099","display_name":"Anna Hilsmann","orcid":"https://orcid.org/0000-0002-2086-0951"},"institutions":[{"id":"https://openalex.org/I2800274787","display_name":"Fraunhofer Institute for Telecommunications, Heinrich Hertz Institute","ror":"https://ror.org/02tbr6331","country_code":"DE","type":"facility","lineage":["https://openalex.org/I2800274787","https://openalex.org/I4923324"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Anna Hilsmann","raw_affiliation_strings":["Fraunhofer Heinrich-Hertz-Institut, HHI,Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Fraunhofer Heinrich-Hertz-Institut, HHI,Germany","institution_ids":["https://openalex.org/I2800274787"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5009614926","display_name":"Peter Eisert","orcid":"https://orcid.org/0000-0001-8378-4805"},"institutions":[{"id":"https://openalex.org/I2800274787","display_name":"Fraunhofer Institute for Telecommunications, Heinrich Hertz Institute","ror":"https://ror.org/02tbr6331","country_code":"DE","type":"facility","lineage":["https://openalex.org/I2800274787","https://openalex.org/I4923324"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Peter Eisert","raw_affiliation_strings":["Fraunhofer Heinrich-Hertz-Institut, HHI,Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Fraunhofer Heinrich-Hertz-Institut, HHI,Germany","institution_ids":["https://openalex.org/I2800274787"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5075158019"],"corresponding_institution_ids":["https://openalex.org/I2800274787"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.24065899,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"4868","last_page":"4877"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T14339","display_name":"Image Processing and 3D Reconstruction","score":0.9790999889373779,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T14339","display_name":"Image Processing and 3D Reconstruction","score":0.9790999889373779,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9621000289916992,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9587000012397766,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.7889000177383423},{"id":"https://openalex.org/keywords/extractor","display_name":"Extractor","score":0.7050999999046326},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5767999887466431},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5453000068664551},{"id":"https://openalex.org/keywords/binary-number","display_name":"Binary number","score":0.49410000443458557},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.4869999885559082},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.45170000195503235},{"id":"https://openalex.org/keywords/contrast","display_name":"Contrast (vision)","score":0.44020000100135803},{"id":"https://openalex.org/keywords/labeled-data","display_name":"Labeled data","score":0.412200003862381}],"concepts":[{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.7889000177383423},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7269999980926514},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7161999940872192},{"id":"https://openalex.org/C117978034","wikidata":"https://www.wikidata.org/wiki/Q5422192","display_name":"Extractor","level":2,"score":0.7050999999046326},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5767999887466431},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5453000068664551},{"id":"https://openalex.org/C48372109","wikidata":"https://www.wikidata.org/wiki/Q3913","display_name":"Binary number","level":2,"score":0.49410000443458557},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.4869999885559082},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.45170000195503235},{"id":"https://openalex.org/C2776502983","wikidata":"https://www.wikidata.org/wiki/Q690182","display_name":"Contrast (vision)","level":2,"score":0.44020000100135803},{"id":"https://openalex.org/C2776145971","wikidata":"https://www.wikidata.org/wiki/Q30673951","display_name":"Labeled data","level":2,"score":0.412200003862381},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4043000042438507},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.40290001034736633},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.37059998512268066},{"id":"https://openalex.org/C63435697","wikidata":"https://www.wikidata.org/wiki/Q864135","display_name":"Binary code","level":3,"score":0.35749998688697815},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3368000090122223},{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.31040000915527344},{"id":"https://openalex.org/C4725764","wikidata":"https://www.wikidata.org/wiki/Q844704","display_name":"Extraction (chemistry)","level":2,"score":0.3009999990463257},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.29580000042915344},{"id":"https://openalex.org/C165838908","wikidata":"https://www.wikidata.org/wiki/Q736777","display_name":"Calibration","level":2,"score":0.29170000553131104},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.29019999504089355},{"id":"https://openalex.org/C66905080","wikidata":"https://www.wikidata.org/wiki/Q17005494","display_name":"Binary classification","level":3,"score":0.2793000042438507},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.27630001306533813},{"id":"https://openalex.org/C75294576","wikidata":"https://www.wikidata.org/wiki/Q5165192","display_name":"Contextual image classification","level":3,"score":0.26460000872612},{"id":"https://openalex.org/C160920958","wikidata":"https://www.wikidata.org/wiki/Q7662746","display_name":"Synthetic data","level":2,"score":0.2574999928474426},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.2574000060558319},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2517000138759613}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/iccv51701.2025.00463","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccv51701.2025.00463","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/CVF International Conference on Computer Vision (ICCV)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2507.04839","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2507.04839","pdf_url":"https://arxiv.org/pdf/2507.04839","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2507.04839","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2507.04839","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2507.04839","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2507.04839","pdf_url":"https://arxiv.org/pdf/2507.04839","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2163774768","display_name":null,"funder_award_id":"01IS2407A","funder_id":"https://openalex.org/F4320321114","funder_display_name":"Bundesministerium f\u00fcr Bildung und Forschung"}],"funders":[{"id":"https://openalex.org/F4320321114","display_name":"Bundesministerium f\u00fcr Bildung und Forschung","ror":"https://ror.org/04pz7b180"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"We":[0],"introduce":[1],"RIPE,":[2],"an":[3,100],"innovative":[4],"reinforcement":[5],"learning-based":[6],"framework":[7],"for":[8,81],"weakly-supervised":[9],"training":[10,27,62],"of":[11,61,67,84,108],"a":[12,43,68,88,132],"keypoint":[13,73,137],"extractor":[14],"that":[15,29,118],"excels":[16],"in":[17,135],"both":[18],"detection":[19],"and":[20,71,139],"description":[21,83],"tasks.":[22],"In":[23],"contrast":[24],"to":[25,91,103,128],"conventional":[26],"regimes":[28],"depend":[30],"heavily":[31],"on":[32,114],"artificial":[33],"transformations,":[34],"pre-generated":[35],"models,":[36],"or":[37],"3D":[38],"data,":[39,63],"RIPE":[40,75,119],"requires":[41],"only":[42],"binary":[44],"label":[45],"indicating":[46],"whether":[47],"paired":[48],"images":[49],"represent":[50],"the":[51,59,65,77,82,85,105,109],"same":[52],"scene.":[53],"This":[54],"minimal":[55],"supervision":[56],"significantly":[57],"expands":[58],"pool":[60],"enabling":[64],"creation":[66],"highly":[69],"generalized":[70],"robust":[72,136],"extractor.":[74],"utilizes":[76],"encoder's":[78],"intermediate":[79],"layers":[80],"keypoints":[86],"with":[87],"hyper-column":[89],"approach":[90],"integrate":[92],"information":[93],"from":[94],"different":[95],"scales.":[96],"Additionally,":[97],"we":[98,145],"propose":[99],"auxiliary":[101],"loss":[102],"enhance":[104],"discriminative":[106],"capability":[107],"learned":[110],"descriptors.":[111],"Comprehensive":[112],"evaluations":[113],"standard":[115],"benchmarks":[116],"demonstrate":[117],"simplifies":[120],"data":[121],"preparation":[122],"while":[123],"achieving":[124],"competitive":[125],"performance":[126],"compared":[127],"state-of-the-art":[129],"techniques,":[130],"marking":[131],"significant":[133],"advancement":[134],"extraction":[138],"description.":[140],"To":[141],"support":[142],"further":[143],"research,":[144],"have":[146],"made":[147],"our":[148],"code":[149],"publicly":[150],"available":[151],"at":[152],"https://github.com/fraunhoferhhi/RIPE.":[153]},"counts_by_year":[],"updated_date":"2026-05-06T06:03:25.996018","created_date":"2025-10-10T00:00:00"}
