{"id":"https://openalex.org/W2613999312","doi":"https://doi.org/10.1109/icit.2017.7915468","title":"Model based path planning using Q-Learning","display_name":"Model based path planning using Q-Learning","publication_year":2017,"publication_date":"2017-03-01","ids":{"openalex":"https://openalex.org/W2613999312","doi":"https://doi.org/10.1109/icit.2017.7915468","mag":"2613999312"},"language":"en","primary_location":{"id":"doi:10.1109/icit.2017.7915468","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icit.2017.7915468","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE International Conference on Industrial Technology (ICIT)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101797742","display_name":"Avinash Sharma","orcid":"https://orcid.org/0000-0001-8045-0332"},"institutions":[{"id":"https://openalex.org/I83205935","display_name":"Malaviya National Institute of Technology Jaipur","ror":"https://ror.org/0077k1j32","country_code":"IN","type":"education","lineage":["https://openalex.org/I83205935"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Avinash Sharma","raw_affiliation_strings":["Department of Electrical Engineering, Malaviya National Institute of Technology, Jaipur, India"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, Malaviya National Institute of Technology, Jaipur, India","institution_ids":["https://openalex.org/I83205935"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103427688","display_name":"Kanika Gupta","orcid":null},"institutions":[{"id":"https://openalex.org/I83205935","display_name":"Malaviya National Institute of Technology Jaipur","ror":"https://ror.org/0077k1j32","country_code":"IN","type":"education","lineage":["https://openalex.org/I83205935"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Kanika Gupta","raw_affiliation_strings":["Department of Electrical Engineering, Malaviya National Institute of Technology, Jaipur, India"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, Malaviya National Institute of Technology, Jaipur, India","institution_ids":["https://openalex.org/I83205935"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006403584","display_name":"Anirudha Kumar","orcid":null},"institutions":[{"id":"https://openalex.org/I83205935","display_name":"Malaviya National Institute of Technology Jaipur","ror":"https://ror.org/0077k1j32","country_code":"IN","type":"education","lineage":["https://openalex.org/I83205935"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Anirudha Kumar","raw_affiliation_strings":["Department of Electrical Engineering, Malaviya National Institute of Technology, Jaipur, India"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, Malaviya National Institute of Technology, Jaipur, India","institution_ids":["https://openalex.org/I83205935"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028415302","display_name":"Aishwarya Sharma","orcid":"https://orcid.org/0009-0007-2529-3267"},"institutions":[{"id":"https://openalex.org/I83205935","display_name":"Malaviya National Institute of Technology Jaipur","ror":"https://ror.org/0077k1j32","country_code":"IN","type":"education","lineage":["https://openalex.org/I83205935"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Aishwarya Sharma","raw_affiliation_strings":["Department of Electrical Engineering, Malaviya National Institute of Technology, Jaipur, India"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, Malaviya National Institute of Technology, Jaipur, India","institution_ids":["https://openalex.org/I83205935"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5052848876","display_name":"Rajesh Kumar","orcid":"https://orcid.org/0000-0002-6019-0702"},"institutions":[{"id":"https://openalex.org/I83205935","display_name":"Malaviya National Institute of Technology Jaipur","ror":"https://ror.org/0077k1j32","country_code":"IN","type":"education","lineage":["https://openalex.org/I83205935"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Rajesh Kumar","raw_affiliation_strings":["Department of Electrical Engineering, Malaviya National Institute of Technology, Jaipur, India"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, Malaviya National Institute of Technology, Jaipur, India","institution_ids":["https://openalex.org/I83205935"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5101797742"],"corresponding_institution_ids":["https://openalex.org/I83205935"],"apc_list":null,"apc_paid":null,"fwci":1.4551,"has_fulltext":false,"cited_by_count":14,"citation_normalized_percentile":{"value":0.8650381,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"837","last_page":"842"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12784","display_name":"Modular Robots and Swarm Intelligence","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/2210","display_name":"Mechanical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8717877864837646},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7760283946990967},{"id":"https://openalex.org/keywords/flexibility","display_name":"Flexibility (engineering)","score":0.6749844551086426},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6576425433158875},{"id":"https://openalex.org/keywords/reliability","display_name":"Reliability (semiconductor)","score":0.6019086837768555},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.5978472828865051},{"id":"https://openalex.org/keywords/grid","display_name":"Grid","score":0.5550841093063354},{"id":"https://openalex.org/keywords/q-learning","display_name":"Q-learning","score":0.5533216595649719},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5320597290992737},{"id":"https://openalex.org/keywords/motion-planning","display_name":"Motion planning","score":0.5268284678459167},{"id":"https://openalex.org/keywords/path","display_name":"Path (computing)","score":0.4739679992198944},{"id":"https://openalex.org/keywords/robotics","display_name":"Robotics","score":0.47016212344169617},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.457472562789917},{"id":"https://openalex.org/keywords/robot-learning","display_name":"Robot learning","score":0.45565155148506165},{"id":"https://openalex.org/keywords/training","display_name":"Training (meteorology)","score":0.44625574350357056},{"id":"https://openalex.org/keywords/mobile-robot","display_name":"Mobile robot","score":0.28321999311447144},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.13424432277679443}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8717877864837646},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7760283946990967},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.6749844551086426},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6576425433158875},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.6019086837768555},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.5978472828865051},{"id":"https://openalex.org/C187691185","wikidata":"https://www.wikidata.org/wiki/Q2020720","display_name":"Grid","level":2,"score":0.5550841093063354},{"id":"https://openalex.org/C188116033","wikidata":"https://www.wikidata.org/wiki/Q2664563","display_name":"Q-learning","level":3,"score":0.5533216595649719},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5320597290992737},{"id":"https://openalex.org/C81074085","wikidata":"https://www.wikidata.org/wiki/Q366872","display_name":"Motion planning","level":3,"score":0.5268284678459167},{"id":"https://openalex.org/C2777735758","wikidata":"https://www.wikidata.org/wiki/Q817765","display_name":"Path (computing)","level":2,"score":0.4739679992198944},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.47016212344169617},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.457472562789917},{"id":"https://openalex.org/C188888258","wikidata":"https://www.wikidata.org/wiki/Q7353390","display_name":"Robot learning","level":4,"score":0.45565155148506165},{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.44625574350357056},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.28321999311447144},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.13424432277679443},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C153294291","wikidata":"https://www.wikidata.org/wiki/Q25261","display_name":"Meteorology","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icit.2017.7915468","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icit.2017.7915468","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE International Conference on Industrial Technology (ICIT)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/11","score":0.5699999928474426,"display_name":"Sustainable cities and communities"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":29,"referenced_works":["https://openalex.org/W16593501","https://openalex.org/W1874218954","https://openalex.org/W1965640670","https://openalex.org/W1977655452","https://openalex.org/W1982803779","https://openalex.org/W1997208542","https://openalex.org/W2012587148","https://openalex.org/W2080759927","https://openalex.org/W2082691056","https://openalex.org/W2095705004","https://openalex.org/W2098049033","https://openalex.org/W2111305343","https://openalex.org/W2111967991","https://openalex.org/W2119717200","https://openalex.org/W2149860990","https://openalex.org/W2155007355","https://openalex.org/W2161966552","https://openalex.org/W2169209873","https://openalex.org/W4205513846","https://openalex.org/W4214717370","https://openalex.org/W4237733001","https://openalex.org/W4285719527","https://openalex.org/W4298857966","https://openalex.org/W6600698939","https://openalex.org/W6674330103","https://openalex.org/W6676560026","https://openalex.org/W6682093400","https://openalex.org/W6683603353","https://openalex.org/W6685331716"],"related_works":["https://openalex.org/W3096874164","https://openalex.org/W2166117066","https://openalex.org/W2357975469","https://openalex.org/W2136202932","https://openalex.org/W3087814763","https://openalex.org/W2892507673","https://openalex.org/W2361647908","https://openalex.org/W2937181779","https://openalex.org/W2537866915","https://openalex.org/W3127551068"],"abstract_inverted_index":{"Though":[0],"the":[1,20,42,88,96,101,115,134,138,148,154,161,166],"classical":[2],"robotics":[3],"is":[4,16,130,143],"highly":[5],"proficient":[6],"in":[7,24,32,41,71,100,133],"accomplishing":[8],"a":[9,62,108,125],"lot":[10],"of":[11,26,87,91,137,165],"complex":[12],"tasks,":[13],"still":[14],"it":[15],"far":[17],"from":[18],"exhibiting":[19],"human-like":[21],"natural":[22],"intelligence":[23],"terms":[25],"flexibility":[27],"and":[28,163],"reliability":[29,164],"to":[30,37,48,67,69,84,146],"work":[31,70],"dynamic":[33],"scenarios.":[34,104],"In":[35],"order":[36],"render":[38],"these":[39],"qualities":[40],"robots,":[43],"reinforcement":[44,59],"learning":[45,54,60,77],"could":[46],"prove":[47],"be":[49,65,80],"quite":[50,81,98],"effective.":[51],"By":[52],"employing":[53],"based":[55,110,118,127],"training":[56,92,97,136,168],"provided":[57],"by":[58,152],"methods,":[61],"robot":[63],"can":[64,79],"made":[66],"learn":[68,147],"previously":[72],"unforeseen":[73],"situations.":[74],"Still":[75],"this":[76],"task":[78],"cumbersome":[82],"due":[83],"its":[85],"requirement":[86],"huge":[89],"amount":[90],"data":[93],"which":[94,129],"makes":[95],"inefficient":[99],"real":[102,149,155],"world":[103,150,156],"The":[105,120,140],"paper":[106],"proposes":[107],"model":[109],"path":[111],"planning":[112],"method":[113],"using":[114,124,153],"\u03b5":[116],"greedy":[117],"Q-learning.":[119],"scenario":[121],"was":[122],"modeled":[123],"grid-world":[126],"simulator":[128],"being":[131],"used":[132],"initial":[135],"agent.":[139],"trained":[141],"policy":[142],"then":[144],"improved":[145],"dynamics":[151],"samples.":[157],"This":[158],"study":[159],"proves":[160],"efficiency":[162],"simulator-based":[167],"methodology.":[169]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":4},{"year":2019,"cited_by_count":3}],"updated_date":"2026-04-17T18:11:37.981687","created_date":"2025-10-10T00:00:00"}
