{"id":"https://openalex.org/W4415124292","doi":"https://doi.org/10.48550/arxiv.2506.13027","title":"DETRPose: Real-time end-to-end transformer model for multi-person pose estimation","display_name":"DETRPose: Real-time end-to-end transformer model for multi-person pose estimation","publication_year":2025,"publication_date":"2025-06-16","ids":{"openalex":"https://openalex.org/W4415124292","doi":"https://doi.org/10.48550/arxiv.2506.13027"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2506.13027","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2506.13027","pdf_url":"https://arxiv.org/pdf/2506.13027","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2506.13027","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5114414699","display_name":"Sebastian Janampa","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Janampa, Sebastian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Pattichis, Marios","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pattichis, Marios","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12740","display_name":"Gait Recognition and Analysis","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pose","display_name":"Pose","score":0.5856999754905701},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5503000020980835},{"id":"https://openalex.org/keywords/quantization","display_name":"Quantization (signal processing)","score":0.550000011920929},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.435699999332428},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.374099999666214},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.3734000027179718}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5916000008583069},{"id":"https://openalex.org/C52102323","wikidata":"https://www.wikidata.org/wiki/Q1671968","display_name":"Pose","level":2,"score":0.5856999754905701},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5503000020980835},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5503000020980835},{"id":"https://openalex.org/C28855332","wikidata":"https://www.wikidata.org/wiki/Q198099","display_name":"Quantization (signal processing)","level":2,"score":0.550000011920929},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.435699999332428},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.374099999666214},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.3734000027179718},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.34619998931884766},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.32190001010894775},{"id":"https://openalex.org/C167928553","wikidata":"https://www.wikidata.org/wiki/Q1376021","display_name":"Estimation theory","level":2,"score":0.31839999556541443},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3147999942302704},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.3131999969482422},{"id":"https://openalex.org/C5339829","wikidata":"https://www.wikidata.org/wiki/Q1425977","display_name":"Machine vision","level":2,"score":0.27880001068115234},{"id":"https://openalex.org/C96250715","wikidata":"https://www.wikidata.org/wiki/Q965330","display_name":"Estimation","level":2,"score":0.27160000801086426},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.2574999928474426},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2500999867916107}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2506.13027","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2506.13027","pdf_url":"https://arxiv.org/pdf/2506.13027","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2506.13027","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2506.13027","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2506.13027","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2506.13027","pdf_url":"https://arxiv.org/pdf/2506.13027","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Multi-person":[0],"pose":[1,54],"estimation":[2,55],"(MPPE)":[3],"estimates":[4],"keypoints":[5],"for":[6,18],"all":[7],"individuals":[8],"present":[9],"in":[10,21,38,56],"an":[11],"image.":[12],"MPPE":[13,37],"is":[14],"a":[15,44,61],"fundamental":[16],"task":[17],"several":[19],"applications":[20],"computer":[22],"vision":[23],"and":[24,65,73],"virtual":[25],"reality.":[26],"Unfortunately,":[27],"there":[28],"are":[29],"currently":[30],"no":[31],"transformer-based":[32,47],"models":[33,48,93,120],"that":[34],"can":[35],"perform":[36],"real":[39],"time.":[40],"The":[41],"paper":[42],"presents":[43],"family":[45],"of":[46,50,80],"capable":[49],"performing":[51],"multi-person":[52],"2D":[53],"real-time.":[57],"Our":[58],"approach":[59],"utilizes":[60],"modified":[62],"decoder":[63],"architecture":[64],"keypoint":[66],"similarity":[67],"metrics":[68],"to":[69,88,99,112],"generate":[70],"both":[71],"positive":[72],"negative":[74],"queries,":[75],"thereby":[76],"enhancing":[77],"the":[78,81,85,115],"quality":[79],"selected":[82],"queries":[83],"within":[84],"architecture.":[86],"Compared":[87],"state-of-the-art":[89],"models,":[90,127],"our":[91,118],"proposed":[92,119],"train":[94],"much":[95],"faster,":[96],"using":[97,129],"5":[98],"10":[100],"times":[101,107],"fewer":[102,131],"epochs,":[103],"with":[104],"competitive":[105,122],"inference":[106],"without":[108],"requiring":[109],"quantization":[110],"libraries":[111],"speed":[113],"up":[114],"model.":[116],"Furthermore,":[117],"provide":[121],"results":[123],"or":[124],"outperform":[125],"alternative":[126],"often":[128],"significantly":[130],"parameters.":[132]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-14T00:00:00"}
