{"id":"https://openalex.org/W7138929138","doi":"https://doi.org/10.48550/arxiv.2603.16427","title":"Cross-modal learning for plankton recognition","display_name":"Cross-modal learning for plankton recognition","publication_year":2026,"publication_date":"2026-03-17","ids":{"openalex":"https://openalex.org/W7138929138","doi":"https://doi.org/10.48550/arxiv.2603.16427"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.16427","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.16427","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.16427","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5117614234","display_name":"Joona Kareinen","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Kareinen, Joona","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5092645137","display_name":"Veikka Immonen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Immonen, Veikka","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129815362","display_name":"Tuomas Eerola","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Eerola, Tuomas","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033088568","display_name":"Lumi Haraguchi","orcid":"https://orcid.org/0000-0001-6307-1808"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Haraguchi, Lumi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066670639","display_name":"Lasse Lensu","orcid":"https://orcid.org/0000-0002-7691-121X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lensu, Lasse","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079371152","display_name":"Kaisa Kraft","orcid":"https://orcid.org/0000-0001-6290-3887"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kraft, Kaisa","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074298865","display_name":"Sanna Suikkanen","orcid":"https://orcid.org/0000-0002-0768-8149"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Suikkanen, Sanna","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5018012580","display_name":"Heikki K\u00e4lvi\u00e4inen","orcid":"https://orcid.org/0000-0002-0790-6847"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"K\u00e4lvi\u00e4inen, Heikki","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5117614234"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12859","display_name":"Cell Image Analysis Techniques","score":0.14030000567436218,"subfield":{"id":"https://openalex.org/subfields/1304","display_name":"Biophysics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T12859","display_name":"Cell Image Analysis Techniques","score":0.14030000567436218,"subfield":{"id":"https://openalex.org/subfields/1304","display_name":"Biophysics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10032","display_name":"Marine and coastal ecosystems","score":0.13860000669956207,"subfield":{"id":"https://openalex.org/subfields/1910","display_name":"Oceanography"},"field":{"id":"https://openalex.org/fields/19","display_name":"Earth and Planetary Sciences"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12697","display_name":"Water Quality Monitoring Technologies","score":0.04360000044107437,"subfield":{"id":"https://openalex.org/subfields/2312","display_name":"Water Science and Technology"},"field":{"id":"https://openalex.org/fields/23","display_name":"Environmental Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/plankton","display_name":"Plankton","score":0.8237000107765198},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.45899999141693115},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.445499986410141},{"id":"https://openalex.org/keywords/image-processing","display_name":"Image processing","score":0.4056999981403351},{"id":"https://openalex.org/keywords/modalities","display_name":"Modalities","score":0.4043999910354614},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.39250001311302185},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.36239999532699585}],"concepts":[{"id":"https://openalex.org/C108469399","wikidata":"https://www.wikidata.org/wiki/Q25367","display_name":"Plankton","level":2,"score":0.8237000107765198},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6137999892234802},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.525600016117096},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.45899999141693115},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.445499986410141},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.4056999981403351},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.4043999910354614},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.39250001311302185},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.36239999532699585},{"id":"https://openalex.org/C48372109","wikidata":"https://www.wikidata.org/wiki/Q3913","display_name":"Binary number","level":2,"score":0.3409999907016754},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.33090001344680786},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.3003000020980835},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2987000048160553},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.2980000078678131},{"id":"https://openalex.org/C44280652","wikidata":"https://www.wikidata.org/wiki/Q104837","display_name":"Phase (matter)","level":2,"score":0.28600001335144043},{"id":"https://openalex.org/C62649853","wikidata":"https://www.wikidata.org/wiki/Q199687","display_name":"Remote sensing","level":1,"score":0.2833999991416931},{"id":"https://openalex.org/C112313634","wikidata":"https://www.wikidata.org/wiki/Q7886648","display_name":"Complement (music)","level":5,"score":0.27889999747276306},{"id":"https://openalex.org/C198531522","wikidata":"https://www.wikidata.org/wiki/Q485146","display_name":"Sample (material)","level":2,"score":0.27570000290870667},{"id":"https://openalex.org/C141379421","wikidata":"https://www.wikidata.org/wiki/Q6094427","display_name":"Iterative reconstruction","level":2,"score":0.25270000100135803},{"id":"https://openalex.org/C133462117","wikidata":"https://www.wikidata.org/wiki/Q4929239","display_name":"Data collection","level":2,"score":0.25029999017715454}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.16427","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.16427","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.16427","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.16427","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"This":[0,169],"paper":[1],"considers":[2],"self-supervised":[3,219],"cross-modal":[4],"coordination":[5],"as":[6,81],"a":[7,39,137,156,166,172,204],"strategy":[8],"enabling":[9],"utilization":[10],"of":[11,17,34,102,160,181,207],"multiple":[12],"modalities":[13,129],"and":[14,83,140,188],"large":[15,40],"volumes":[16],"unlabeled":[18],"plankton":[19,25,35,46,70,93,152,162],"data":[20,37,106],"to":[21,62,107],"build":[22],"models":[23],"for":[24,44,127],"recognition.":[26,94],"Automated":[27],"imaging":[28,71],"instruments":[29,72],"facilitate":[30],"the":[31,65,100,109,118,144,194,214],"continuous":[32],"collection":[33],"image":[36,47,74,139,187],"on":[38,51],"scale.":[41],"Current":[42],"methods":[43],"automatic":[45],"recognition":[48,173,199],"rely":[49],"primarily":[50],"supervised":[52],"approaches,":[53],"which":[54,86],"require":[55],"labeled":[56,158,208],"training":[57],"sets":[58],"that":[59,175,193,213],"are":[60,88],"labor-intensive":[61],"collect.":[63],"On":[64],"other":[66],"hand,":[67],"some":[68],"modern":[69],"complement":[73],"information":[75,134,183],"with":[76,165],"optical":[77],"measurement":[78,105],"data,":[79],"such":[80,104],"scatter":[82],"fluorescence":[84],"profiles,":[85],"currently":[87],"not":[89],"widely":[90],"utilized":[91],"in":[92],"In":[95],"this":[96],"work,":[97],"we":[98,124,154,211],"explore":[99],"possibility":[101],"using":[103,130],"guide":[108],"learning":[110],"process":[111],"without":[112],"requiring":[113,202],"manual":[114],"labeling.":[115],"Inspired":[116],"by":[117],"concepts":[119],"behind":[120],"Contrastive":[121],"Language-Image":[122],"Pre-training,":[123],"train":[125],"encoders":[126],"both":[128,186],"only":[131,203],"binary":[132],"supervisory":[133],"indicating":[135],"whether":[136],"given":[138],"profile":[141,189],"originate":[142],"from":[143,148,185],"same":[145],"particle":[146],"or":[147],"different":[149],"particles.":[150],"For":[151],"recognition,":[153],"employ":[155],"small":[157],"gallery":[159],"known":[161],"species":[163],"combined":[164],"$k$-NN":[167],"classifier.":[168],"approach":[170,215],"yields":[171],"model":[174],"is":[176],"inherently":[177],"multimodal,":[178],"i.e.,":[179],"capable":[180],"utilizing":[182],"extracted":[184],"data.":[190],"We":[191],"demonstrate":[192],"proposed":[195],"method":[196],"achieves":[197],"high":[198],"accuracy":[200],"while":[201],"minimal":[205],"number":[206],"images.":[209],"Furthermore,":[210],"show":[212],"outperforms":[216],"an":[217],"image-only":[218],"baseline.":[220],"Code":[221],"available":[222],"at":[223],"https://github.com/Jookare/cross-modal-plankton.":[224]},"counts_by_year":[],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2026-03-20T00:00:00"}
