{"id":5536,"date":"2023-03-06T20:33:55","date_gmt":"2023-03-06T20:33:55","guid":{"rendered":"https:\/\/www.quanser.com\/resource\/reinforcement-learning\/"},"modified":"2026-01-22T09:42:16","modified_gmt":"2026-01-22T14:42:16","slug":"reinforcement-learning","status":"publish","type":"resource","link":"https:\/\/www.quanser.com\/resource\/reinforcement-learning\/","title":{"rendered":"Reinforcement Learning"},"content":{"rendered":"","protected":false},"excerpt":{"rendered":"","protected":false},"featured_media":10748,"template":"","resource-type":[303],"resource-user":[302],"application":[524,521],"class_list":["post-5536","resource","type-resource","status-publish","has-post-thumbnail","hentry","resource-type-whitepapers","resource-user-matlab","application-applied-ai","application-control-systems-dynamics"],"acf":[],"yoast_head":"<!-- This site is optimized with the Yoast SEO plugin v26.8 - https:\/\/yoast.com\/product\/yoast-seo-wordpress\/ -->\n<title>Reinforcement Learning - Quanser<\/title>\n<meta name=\"robots\" content=\"index, follow, max-snippet:-1, max-image-preview:large, max-video-preview:-1\" \/>\n<link rel=\"canonical\" href=\"https:\/\/www.quanser.com\/resource\/reinforcement-learning\/\" \/>\n<meta property=\"og:locale\" content=\"en_US\" \/>\n<meta property=\"og:type\" content=\"article\" \/>\n<meta property=\"og:title\" content=\"Reinforcement Learning - Quanser\" \/>\n<meta property=\"og:url\" content=\"https:\/\/www.quanser.com\/resource\/reinforcement-learning\/\" \/>\n<meta property=\"og:site_name\" content=\"Quanser\" \/>\n<meta property=\"article:modified_time\" content=\"2026-01-22T14:42:16+00:00\" \/>\n<meta property=\"og:image\" content=\"https:\/\/www.quanser.com\/wp-content\/uploads\/2023\/03\/Webpage-Banner.jpg\" \/>\n\t<meta property=\"og:image:width\" content=\"2500\" \/>\n\t<meta property=\"og:image:height\" content=\"1040\" \/>\n\t<meta property=\"og:image:type\" content=\"image\/jpeg\" \/>\n<meta name=\"twitter:card\" content=\"summary_large_image\" \/>\n<meta name=\"twitter:label1\" content=\"Est. reading time\" \/>\n\t<meta name=\"twitter:data1\" content=\"1 minute\" \/>\n<script type=\"application\/ld+json\" class=\"yoast-schema-graph\">{\"@context\":\"https:\/\/schema.org\",\"@graph\":[{\"@type\":\"WebPage\",\"@id\":\"https:\/\/www.quanser.com\/resource\/reinforcement-learning\/\",\"url\":\"https:\/\/www.quanser.com\/resource\/reinforcement-learning\/\",\"name\":\"Reinforcement Learning - Quanser\",\"isPartOf\":{\"@id\":\"https:\/\/www.quanser.com\/#website\"},\"primaryImageOfPage\":{\"@id\":\"https:\/\/www.quanser.com\/resource\/reinforcement-learning\/#primaryimage\"},\"image\":{\"@id\":\"https:\/\/www.quanser.com\/resource\/reinforcement-learning\/#primaryimage\"},\"thumbnailUrl\":\"https:\/\/www.quanser.com\/wp-content\/uploads\/2023\/03\/Webpage-Banner.jpg\",\"datePublished\":\"2023-03-06T20:33:55+00:00\",\"dateModified\":\"2026-01-22T14:42:16+00:00\",\"breadcrumb\":{\"@id\":\"https:\/\/www.quanser.com\/resource\/reinforcement-learning\/#breadcrumb\"},\"inLanguage\":\"en-US\",\"potentialAction\":[{\"@type\":\"ReadAction\",\"target\":[\"https:\/\/www.quanser.com\/resource\/reinforcement-learning\/\"]}]},{\"@type\":\"ImageObject\",\"inLanguage\":\"en-US\",\"@id\":\"https:\/\/www.quanser.com\/resource\/reinforcement-learning\/#primaryimage\",\"url\":\"https:\/\/www.quanser.com\/wp-content\/uploads\/2023\/03\/Webpage-Banner.jpg\",\"contentUrl\":\"https:\/\/www.quanser.com\/wp-content\/uploads\/2023\/03\/Webpage-Banner.jpg\",\"width\":2500,\"height\":1040},{\"@type\":\"BreadcrumbList\",\"@id\":\"https:\/\/www.quanser.com\/resource\/reinforcement-learning\/#breadcrumb\",\"itemListElement\":[{\"@type\":\"ListItem\",\"position\":1,\"name\":\"Home\",\"item\":\"https:\/\/www.quanser.com\/\"},{\"@type\":\"ListItem\",\"position\":2,\"name\":\"Reinforcement Learning\"}]},{\"@type\":\"WebSite\",\"@id\":\"https:\/\/www.quanser.com\/#website\",\"url\":\"https:\/\/www.quanser.com\/\",\"name\":\"Quanser\",\"description\":\"Innovate Educate\",\"potentialAction\":[{\"@type\":\"SearchAction\",\"target\":{\"@type\":\"EntryPoint\",\"urlTemplate\":\"https:\/\/www.quanser.com\/?s={search_term_string}\"},\"query-input\":{\"@type\":\"PropertyValueSpecification\",\"valueRequired\":true,\"valueName\":\"search_term_string\"}}],\"inLanguage\":\"en-US\"}]}<\/script>\n<!-- \/ Yoast SEO plugin. -->","yoast_head_json":{"title":"Reinforcement Learning - Quanser","robots":{"index":"index","follow":"follow","max-snippet":"max-snippet:-1","max-image-preview":"max-image-preview:large","max-video-preview":"max-video-preview:-1"},"canonical":"https:\/\/www.quanser.com\/resource\/reinforcement-learning\/","og_locale":"en_US","og_type":"article","og_title":"Reinforcement Learning - Quanser","og_url":"https:\/\/www.quanser.com\/resource\/reinforcement-learning\/","og_site_name":"Quanser","article_modified_time":"2026-01-22T14:42:16+00:00","og_image":[{"width":2500,"height":1040,"url":"https:\/\/www.quanser.com\/wp-content\/uploads\/2023\/03\/Webpage-Banner.jpg","type":"image\/jpeg"}],"twitter_card":"summary_large_image","twitter_misc":{"Est. reading time":"1 minute"},"schema":{"@context":"https:\/\/schema.org","@graph":[{"@type":"WebPage","@id":"https:\/\/www.quanser.com\/resource\/reinforcement-learning\/","url":"https:\/\/www.quanser.com\/resource\/reinforcement-learning\/","name":"Reinforcement Learning - Quanser","isPartOf":{"@id":"https:\/\/www.quanser.com\/#website"},"primaryImageOfPage":{"@id":"https:\/\/www.quanser.com\/resource\/reinforcement-learning\/#primaryimage"},"image":{"@id":"https:\/\/www.quanser.com\/resource\/reinforcement-learning\/#primaryimage"},"thumbnailUrl":"https:\/\/www.quanser.com\/wp-content\/uploads\/2023\/03\/Webpage-Banner.jpg","datePublished":"2023-03-06T20:33:55+00:00","dateModified":"2026-01-22T14:42:16+00:00","breadcrumb":{"@id":"https:\/\/www.quanser.com\/resource\/reinforcement-learning\/#breadcrumb"},"inLanguage":"en-US","potentialAction":[{"@type":"ReadAction","target":["https:\/\/www.quanser.com\/resource\/reinforcement-learning\/"]}]},{"@type":"ImageObject","inLanguage":"en-US","@id":"https:\/\/www.quanser.com\/resource\/reinforcement-learning\/#primaryimage","url":"https:\/\/www.quanser.com\/wp-content\/uploads\/2023\/03\/Webpage-Banner.jpg","contentUrl":"https:\/\/www.quanser.com\/wp-content\/uploads\/2023\/03\/Webpage-Banner.jpg","width":2500,"height":1040},{"@type":"BreadcrumbList","@id":"https:\/\/www.quanser.com\/resource\/reinforcement-learning\/#breadcrumb","itemListElement":[{"@type":"ListItem","position":1,"name":"Home","item":"https:\/\/www.quanser.com\/"},{"@type":"ListItem","position":2,"name":"Reinforcement Learning"}]},{"@type":"WebSite","@id":"https:\/\/www.quanser.com\/#website","url":"https:\/\/www.quanser.com\/","name":"Quanser","description":"Innovate Educate","potentialAction":[{"@type":"SearchAction","target":{"@type":"EntryPoint","urlTemplate":"https:\/\/www.quanser.com\/?s={search_term_string}"},"query-input":{"@type":"PropertyValueSpecification","valueRequired":true,"valueName":"search_term_string"}}],"inLanguage":"en-US"}]}},"_links":{"self":[{"href":"https:\/\/www.quanser.com\/wp-json\/wp\/v2\/resource\/5536","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/www.quanser.com\/wp-json\/wp\/v2\/resource"}],"about":[{"href":"https:\/\/www.quanser.com\/wp-json\/wp\/v2\/types\/resource"}],"wp:featuredmedia":[{"embeddable":true,"href":"https:\/\/www.quanser.com\/wp-json\/wp\/v2\/media\/10748"}],"wp:attachment":[{"href":"https:\/\/www.quanser.com\/wp-json\/wp\/v2\/media?parent=5536"}],"wp:term":[{"taxonomy":"resource-type","embeddable":true,"href":"https:\/\/www.quanser.com\/wp-json\/wp\/v2\/resource-type?post=5536"},{"taxonomy":"resource-user","embeddable":true,"href":"https:\/\/www.quanser.com\/wp-json\/wp\/v2\/resource-user?post=5536"},{"taxonomy":"application","embeddable":true,"href":"https:\/\/www.quanser.com\/wp-json\/wp\/v2\/application?post=5536"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}