{"id":663258,"date":"2020-05-29T14:43:18","date_gmt":"2020-05-29T21:43:18","guid":{"rendered":"https:\/\/www.microsoft.com\/en-us\/research\/?post_type=msr-group&#038;p=663258"},"modified":"2021-10-26T13:20:23","modified_gmt":"2021-10-26T20:20:23","slug":"reinforcement-learning-montreal","status":"publish","type":"msr-group","link":"https:\/\/www.microsoft.com\/en-us\/research\/theme\/reinforcement-learning-montreal\/","title":{"rendered":"Reinforcement Learning | Montr\u00e9al"},"content":{"rendered":"<section class=\"mb-3 moray-highlight\">\n\t<div class=\"card-img-overlay mx-lg-0\">\n\t\t<div class=\"card-background  has-background- card-background--full-bleed\">\n\t\t\t<img loading=\"lazy\" decoding=\"async\" width=\"3840\" height=\"1440\" src=\"https:\/\/www.microsoft.com\/en-us\/research\/wp-content\/uploads\/2012\/12\/Theme-navy_RL_header_12_2019__1920x720.png\" class=\"attachment-full size-full\" alt=\"MSR theme: Reinforcement Learning Research\" style=\"\" srcset=\"https:\/\/www.microsoft.com\/en-us\/research\/wp-content\/uploads\/2012\/12\/Theme-navy_RL_header_12_2019__1920x720.png 3840w, https:\/\/www.microsoft.com\/en-us\/research\/wp-content\/uploads\/2012\/12\/Theme-navy_RL_header_12_2019__1920x720-300x113.png 300w, https:\/\/www.microsoft.com\/en-us\/research\/wp-content\/uploads\/2012\/12\/Theme-navy_RL_header_12_2019__1920x720-1024x384.png 1024w, https:\/\/www.microsoft.com\/en-us\/research\/wp-content\/uploads\/2012\/12\/Theme-navy_RL_header_12_2019__1920x720-768x288.png 768w, https:\/\/www.microsoft.com\/en-us\/research\/wp-content\/uploads\/2012\/12\/Theme-navy_RL_header_12_2019__1920x720-1536x576.png 1536w, https:\/\/www.microsoft.com\/en-us\/research\/wp-content\/uploads\/2012\/12\/Theme-navy_RL_header_12_2019__1920x720-2048x768.png 2048w, https:\/\/www.microsoft.com\/en-us\/research\/wp-content\/uploads\/2012\/12\/Theme-navy_RL_header_12_2019__1920x720-1920x720.png 1920w, https:\/\/www.microsoft.com\/en-us\/research\/wp-content\/uploads\/2012\/12\/Theme-navy_RL_header_12_2019__1920x720-1600x600.png 1600w\" sizes=\"auto, (max-width: 3840px) 100vw, 3840px\" \/>\t\t<\/div>\n\t\t<!-- Foreground -->\n\t\t<div class=\"card-foreground d-flex mt-md-n5 my-lg-5 px-g px-lg-0\">\n\t\t\t<!-- Container -->\n\t\t\t<div class=\"container d-flex mt-md-n5 my-lg-5 align-self-center\">\n\t\t\t\t<!-- Card wrapper -->\n\t\t\t\t<div class=\"w-100 w-lg-col-5\">\n\t\t\t\t\t<!-- Card -->\n\t\t\t\t\t<div class=\"card material-md-card py-5 px-md-5\">\n\t\t\t\t\t\t<div class=\"card-body \">\n\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t<a href=\"https:\/\/www.microsoft.com\/en-us\/research\/lab\/microsoft-research-montreal\/\" class=\"icon-link icon-link--reverse mb-2\" data-bi-cN=\"Return to Microsoft Research Lab \u2013 Montr\u00e9al\">\n\t\t\t\t\t\t\t\t\t<span class=\"c-glyph glyph-chevron-left\" aria-hidden=\"true\"><\/span>\n\t\t\t\t\t\t\t\t\tReturn to Microsoft Research Lab \u2013 Montr\u00e9al\t\t\t\t\t\t\t\t<\/a>\n\t\t\t\t\t\t\t\n\t\t\t\t\t\t\t\n\n<h1 id=\"reinforcement-learning-montreal\" class=\"h2\">Reinforcement Learning | Montr\u00e9al<\/h1>\n\n\t\t\t\t\t\t<\/div>\n\t\t\t\t\t<\/div>\n\t\t\t\t<\/div>\n\t\t\t<\/div>\n\t\t<\/div>\n\t<\/div>\n<\/section>\n\n\n\n\n\n<p>MSR Montr\u00e9al focuses on improving the understanding of fundamental concepts in (deep) Reinforcement Learning (RL) and addressing the open problems that need to be overcome to employ RL on a large scale in the real world. For this reason, we work on challenges such as sample-efficiency, (systematic) generalization and robustness\/safety of methods.<\/p>\n\n\n","protected":false},"excerpt":{"rendered":"<p>MSR Montr\u00e9al focuses on improving the understanding of fundamental concepts in (deep) Reinforcement Learning (RL) and addressing the open problems that need to be overcome to employ RL on a large scale in the real world.<\/p>\n","protected":false},"featured_media":627639,"template":"","meta":{"msr-url-field":"","msr-podcast-episode":"","msrModifiedDate":"","msrModifiedDateEnabled":false,"ep_exclude_from_search":false,"_classifai_error":"","msr_group_start":"","footnotes":""},"research-area":[13556],"msr-group-type":[243688],"msr-locale":[268875],"msr-impact-theme":[],"class_list":["post-663258","msr-group","type-msr-group","status-publish","has-post-thumbnail","hentry","msr-research-area-artificial-intelligence","msr-group-type-theme","msr-locale-en_us"],"msr_group_start":"","msr_detailed_description":"","msr_further_details":"","msr_hero_images":[],"msr_research_lab":[437514],"related-researchers":[],"related-publications":[443202,487844,487835,487826,487817,481131,453927,443232,443226,443211,493226,443193,443172,442749,442737,442731,442725,442719,442713,442698,620553,757882,757876,659109,659103,659097,659091,659082,643866,643860,442692,620541,610218,600384,595489,580996,580987,580978,580795,401753,401894,401885,401858,401849,401843,401816,401798,401771,401762,401912,401741,401711,401657,401615,401603,401585,401570,401555,401546,402272,442686,442680,442668,442662,442656,442647,442641,442635,442623,401534,402005,401996,401987,401978,401969,401960,401951,401930],"related-downloads":[],"related-videos":[794069,794099],"related-projects":[615297,577638],"related-events":[],"related-opportunities":[],"related-posts":[455721,590815,720673],"tab-content":[],"msr_impact_theme":[],"_links":{"self":[{"href":"https:\/\/www.microsoft.com\/en-us\/research\/wp-json\/wp\/v2\/msr-group\/663258","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/www.microsoft.com\/en-us\/research\/wp-json\/wp\/v2\/msr-group"}],"about":[{"href":"https:\/\/www.microsoft.com\/en-us\/research\/wp-json\/wp\/v2\/types\/msr-group"}],"version-history":[{"count":11,"href":"https:\/\/www.microsoft.com\/en-us\/research\/wp-json\/wp\/v2\/msr-group\/663258\/revisions"}],"predecessor-version":[{"id":1168710,"href":"https:\/\/www.microsoft.com\/en-us\/research\/wp-json\/wp\/v2\/msr-group\/663258\/revisions\/1168710"}],"wp:featuredmedia":[{"embeddable":true,"href":"https:\/\/www.microsoft.com\/en-us\/research\/wp-json\/wp\/v2\/media\/627639"}],"wp:attachment":[{"href":"https:\/\/www.microsoft.com\/en-us\/research\/wp-json\/wp\/v2\/media?parent=663258"}],"wp:term":[{"taxonomy":"msr-research-area","embeddable":true,"href":"https:\/\/www.microsoft.com\/en-us\/research\/wp-json\/wp\/v2\/research-area?post=663258"},{"taxonomy":"msr-group-type","embeddable":true,"href":"https:\/\/www.microsoft.com\/en-us\/research\/wp-json\/wp\/v2\/msr-group-type?post=663258"},{"taxonomy":"msr-locale","embeddable":true,"href":"https:\/\/www.microsoft.com\/en-us\/research\/wp-json\/wp\/v2\/msr-locale?post=663258"},{"taxonomy":"msr-impact-theme","embeddable":true,"href":"https:\/\/www.microsoft.com\/en-us\/research\/wp-json\/wp\/v2\/msr-impact-theme?post=663258"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}