{"id":"https://openalex.org/W2981335131","doi":"https://doi.org/10.1109/iros40897.2019.8968173","title":"Learning Q-network for Active Information Acquisition","display_name":"Learning Q-network for Active Information Acquisition","publication_year":2019,"publication_date":"2019-11-01","ids":{"openalex":"https://openalex.org/W2981335131","doi":"https://doi.org/10.1109/iros40897.2019.8968173","mag":"2981335131"},"language":"en","primary_location":{"id":"doi:10.1109/iros40897.2019.8968173","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros40897.2019.8968173","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/1910.10754","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5068209902","display_name":"Heejin Jeong","orcid":"https://orcid.org/0000-0002-0122-532X"},"institutions":[{"id":"https://openalex.org/I79576946","display_name":"University of Pennsylvania","ror":"https://ror.org/00b30xv10","country_code":"US","type":"education","lineage":["https://openalex.org/I79576946"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Heejin Jeong","raw_affiliation_strings":["University of Pennsylvania,department of Electrical and Systems Engineering,Philadelphia,PA,USA,19104"],"affiliations":[{"raw_affiliation_string":"University of Pennsylvania,department of Electrical and Systems Engineering,Philadelphia,PA,USA,19104","institution_ids":["https://openalex.org/I79576946"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057774600","display_name":"Brent Schlotfeldt","orcid":"https://orcid.org/0000-0002-2016-6492"},"institutions":[{"id":"https://openalex.org/I79576946","display_name":"University of Pennsylvania","ror":"https://ror.org/00b30xv10","country_code":"US","type":"education","lineage":["https://openalex.org/I79576946"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Brent Schlotfeldt","raw_affiliation_strings":["University of Pennsylvania,department of Electrical and Systems Engineering,Philadelphia,PA,USA,19104"],"affiliations":[{"raw_affiliation_string":"University of Pennsylvania,department of Electrical and Systems Engineering,Philadelphia,PA,USA,19104","institution_ids":["https://openalex.org/I79576946"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059354479","display_name":"Hamed Hassani","orcid":"https://orcid.org/0000-0002-9448-8750"},"institutions":[{"id":"https://openalex.org/I79576946","display_name":"University of Pennsylvania","ror":"https://ror.org/00b30xv10","country_code":"US","type":"education","lineage":["https://openalex.org/I79576946"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Hamed Hassani","raw_affiliation_strings":["University of Pennsylvania,department of Electrical and Systems Engineering,Philadelphia,PA,USA,19104"],"affiliations":[{"raw_affiliation_string":"University of Pennsylvania,department of Electrical and Systems Engineering,Philadelphia,PA,USA,19104","institution_ids":["https://openalex.org/I79576946"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025946191","display_name":"Manfred Morari","orcid":"https://orcid.org/0000-0002-7696-5058"},"institutions":[{"id":"https://openalex.org/I79576946","display_name":"University of Pennsylvania","ror":"https://ror.org/00b30xv10","country_code":"US","type":"education","lineage":["https://openalex.org/I79576946"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Manfred Morari","raw_affiliation_strings":["University of Pennsylvania,department of Electrical and Systems Engineering,Philadelphia,PA,USA,19104"],"affiliations":[{"raw_affiliation_string":"University of Pennsylvania,department of Electrical and Systems Engineering,Philadelphia,PA,USA,19104","institution_ids":["https://openalex.org/I79576946"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007905483","display_name":"Daniel D. Lee","orcid":"https://orcid.org/0000-0002-2163-2686"},"institutions":[{"id":"https://openalex.org/I205783295","display_name":"Cornell University","ror":"https://ror.org/05bnh6r87","country_code":"US","type":"education","lineage":["https://openalex.org/I205783295"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Daniel D. Lee","raw_affiliation_strings":["Cornell University,department of Electrical and Computer Engineering,Ithaca,NY,USA,14850","Cornell University,Department of Electrical and Computer Engineering,Ithaca,NY,USA,14850"],"affiliations":[{"raw_affiliation_string":"Cornell University,department of Electrical and Computer Engineering,Ithaca,NY,USA,14850","institution_ids":["https://openalex.org/I205783295"]},{"raw_affiliation_string":"Cornell University,Department of Electrical and Computer Engineering,Ithaca,NY,USA,14850","institution_ids":["https://openalex.org/I205783295"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5029243115","display_name":"George J. Pappas","orcid":"https://orcid.org/0000-0001-9081-0637"},"institutions":[{"id":"https://openalex.org/I79576946","display_name":"University of Pennsylvania","ror":"https://ror.org/00b30xv10","country_code":"US","type":"education","lineage":["https://openalex.org/I79576946"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"George J. Pappas","raw_affiliation_strings":["University of Pennsylvania,department of Electrical and Systems Engineering,Philadelphia,PA,USA,19104"],"affiliations":[{"raw_affiliation_string":"University of Pennsylvania,department of Electrical and Systems Engineering,Philadelphia,PA,USA,19104","institution_ids":["https://openalex.org/I79576946"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5068209902"],"corresponding_institution_ids":["https://openalex.org/I79576946"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.13003007,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"6822","last_page":"6827"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9934999942779541,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10249","display_name":"Distributed Control Multi-Agent Systems","score":0.9894000291824341,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.9170677661895752},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7052574157714844},{"id":"https://openalex.org/keywords/time-horizon","display_name":"Time horizon","score":0.6308190822601318},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.5127285718917847},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5077439546585083},{"id":"https://openalex.org/keywords/knowledge-acquisition","display_name":"Knowledge acquisition","score":0.4903440475463867},{"id":"https://openalex.org/keywords/maxima-and-minima","display_name":"Maxima and minima","score":0.4552844762802124},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4495851993560791},{"id":"https://openalex.org/keywords/tracking","display_name":"Tracking (education)","score":0.423668771982193},{"id":"https://openalex.org/keywords/information-theory","display_name":"Information theory","score":0.4161820113658905},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.2887069582939148},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.11594203114509583}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.9170677661895752},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7052574157714844},{"id":"https://openalex.org/C28761237","wikidata":"https://www.wikidata.org/wiki/Q7805321","display_name":"Time horizon","level":2,"score":0.6308190822601318},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5127285718917847},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5077439546585083},{"id":"https://openalex.org/C2777220311","wikidata":"https://www.wikidata.org/wiki/Q6423340","display_name":"Knowledge acquisition","level":2,"score":0.4903440475463867},{"id":"https://openalex.org/C186633575","wikidata":"https://www.wikidata.org/wiki/Q845060","display_name":"Maxima and minima","level":2,"score":0.4552844762802124},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4495851993560791},{"id":"https://openalex.org/C2775936607","wikidata":"https://www.wikidata.org/wiki/Q466845","display_name":"Tracking (education)","level":2,"score":0.423668771982193},{"id":"https://openalex.org/C52622258","wikidata":"https://www.wikidata.org/wiki/Q131222","display_name":"Information theory","level":2,"score":0.4161820113658905},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.2887069582939148},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.11594203114509583},{"id":"https://openalex.org/C19417346","wikidata":"https://www.wikidata.org/wiki/Q7922","display_name":"Pedagogy","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1109/iros40897.2019.8968173","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros40897.2019.8968173","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:1910.10754","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1910.10754","pdf_url":"https://arxiv.org/pdf/1910.10754","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"mag:2981335131","is_oa":true,"landing_page_url":"https://arxiv.org/abs/1910.10754v1","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"doi:10.48550/arxiv.1910.10754","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.1910.10754","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article-journal"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:1910.10754","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1910.10754","pdf_url":"https://arxiv.org/pdf/1910.10754","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2981335131.pdf","grobid_xml":"https://content.openalex.org/works/W2981335131.grobid-xml"},"referenced_works_count":43,"referenced_works":["https://openalex.org/W637527836","https://openalex.org/W1594783240","https://openalex.org/W1757796397","https://openalex.org/W1977655452","https://openalex.org/W2032100464","https://openalex.org/W2087421501","https://openalex.org/W2093725709","https://openalex.org/W2098846072","https://openalex.org/W2105480835","https://openalex.org/W2113719290","https://openalex.org/W2116485803","https://openalex.org/W2121863487","https://openalex.org/W2125069195","https://openalex.org/W2143964548","https://openalex.org/W2145339207","https://openalex.org/W2155968351","https://openalex.org/W2168359464","https://openalex.org/W2261891975","https://openalex.org/W2566610034","https://openalex.org/W2570767044","https://openalex.org/W2575705757","https://openalex.org/W2584265939","https://openalex.org/W2593044849","https://openalex.org/W2790514337","https://openalex.org/W2807557496","https://openalex.org/W2809375916","https://openalex.org/W2962824803","https://openalex.org/W2963063317","https://openalex.org/W2963121817","https://openalex.org/W2963714390","https://openalex.org/W2964078006","https://openalex.org/W3099664902","https://openalex.org/W6635508374","https://openalex.org/W6637967152","https://openalex.org/W6676928577","https://openalex.org/W6681861716","https://openalex.org/W6692453020","https://openalex.org/W6693378663","https://openalex.org/W6703780166","https://openalex.org/W6712730493","https://openalex.org/W6733472783","https://openalex.org/W6734206676","https://openalex.org/W6738570108"],"related_works":["https://openalex.org/W3003775893","https://openalex.org/W3095437761","https://openalex.org/W3127517176","https://openalex.org/W2811111819","https://openalex.org/W2025448855","https://openalex.org/W76760840","https://openalex.org/W1925600676","https://openalex.org/W2024877309","https://openalex.org/W2791803308","https://openalex.org/W3015442441","https://openalex.org/W3040858909","https://openalex.org/W2111770102","https://openalex.org/W2770014065","https://openalex.org/W2149738224","https://openalex.org/W3151079898","https://openalex.org/W2963516265","https://openalex.org/W3108136459","https://openalex.org/W2892978054","https://openalex.org/W2569188995","https://openalex.org/W2103064945"],"abstract_inverted_index":{"In":[0,69],"this":[1],"paper,":[2],"we":[3],"propose":[4],"a":[5,23,33,52,144,150],"novel":[6,172],"Reinforcement":[7,129],"Learning":[8],"approach":[9],"for":[10,105,180],"solving":[11],"the":[12,44,49,59,71,86,112,133,159,163,168,171],"Active":[13],"Information":[14],"Acquisition":[15],"problem,":[16],"which":[17,122],"requires":[18],"an":[19,89,175],"agent":[20],"to":[21,29,100,119,174],"choose":[22],"sequence":[24],"of":[25,35,51,61,74,108,135,147,162,170],"actions":[26],"in":[27,43,95,138],"order":[28],"acquire":[30],"information":[31,45,139,177],"about":[32],"process":[34],"interest":[36],"using":[37],"on-board":[38],"sensors.":[39],"The":[40],"classic":[41],"challenges":[42],"acquisition":[46,178],"problem":[47],"are":[48,98,116],"dependence":[50],"planning":[53,114,136],"algorithm":[54,173],"on":[55,82],"known":[56],"models":[57,83],"and":[58,84,103,166],"difficulty":[60],"computing":[62],"information-theoretic":[63],"cost":[64],"functions":[65],"over":[66,149],"arbitrary":[67],"distributions.":[68],"contrast,":[70],"proposed":[72,164],"framework":[73,165],"reinforcement":[75],"learning":[76,130],"does":[77],"not":[78],"require":[79],"any":[80],"knowledge":[81],"alleviates":[85],"problems":[87,140],"during":[88],"extended":[90],"training":[91],"stage.":[92],"It":[93],"results":[94],"policies":[96],"that":[97],"efficient":[99],"execute":[101],"online":[102],"applicable":[104],"real-time":[106],"control":[107],"robotic":[109],"systems.":[110],"Furthermore,":[111],"state-of-the-art":[113],"methods":[115],"typically":[117],"restricted":[118],"short":[120],"horizons,":[121],"may":[123],"become":[124],"problematic":[125],"with":[126],"local":[127],"minima.":[128],"naturally":[131],"handles":[132],"issue":[134],"horizon":[137],"as":[141],"it":[142],"maximizes":[143],"discounted":[145],"sum":[146],"rewards":[148],"long":[151],"finite":[152],"or":[153],"infinite":[154],"time":[155],"horizon.":[156],"We":[157],"discuss":[158],"potential":[160],"benefits":[161],"compare":[167],"performance":[169],"existing":[176],"method":[179],"multi-target":[181],"tracking":[182],"scenarios.":[183]},"counts_by_year":[],"updated_date":"2026-03-10T16:38:18.471706","created_date":"2025-10-10T00:00:00"}
