#EXTM3U #EXT-SL-VERSION:1 #EXT-SL-ACCOUNT-ID:37001 #EXT-SL-PRESENTATION-ID:38941305 #EXT-SL-PRESENTATION-TITLE:Greedy Multi-Step Off-Policy Reinforcement Learning #EXT-SL-PRESENTATION-UPDATED-AT:2023-10-20T13:45:28Z #EXT-SL-PLAYER-TYPE:video_slideshow #EXT-SL-PRESENTATION-THUMBNAIL:https://ma.slideslive.com/library/presentations/38941305/thumbnail/greedy-multistep-offpolicy-reinforcement-learning_ftQUA2_big.jpg #EXT-SL-SLIDESLIVE-LOGO-VISIBLE:false #EXT-SL-SLIDESLIVE-LOGO-LINKIFY:false #EXT-SL-CUSTOM-CMCD-TRACKING:false #EXT-SL-PLAYLIST-TYPE:vod #EXT-SL-PRESENTATION-MEDIA-SET-ID:84073 #EXT-SL-VOD-VIDEO-SERVICE-NAME:yoda #EXT-SL-VOD-VIDEO-ID:Vz1uhYNXq1IY #EXT-SL-VOD-VIDEO-KEN-ENABLED:true #EXT-SL-VOD-VIDEO-SERVERS:["sl-yoda-v3-stream-014-alpha.b-cdn.net","1978117156.rsc.cdn77.org","1243944885.rsc.cdn77.org","sl-yoda-v3-stream-014-beta.b-cdn.net"] #EXT-SL-VOD-SLIDES-XML-URL:https://s.slideslive.com/38941305/v3/38941305.xml?1642088702 #EXT-SL-VOD-SLIDES-JSON-URL:https://s.slideslive.com/38941305/v3/slides.json?1642088702 #EXT-SL-VOD-SUBTITLES:[{"name":"English","language":"en","subtitles_id":43602,"webvtt_url":"https://slideslive-video-subtitles.s3.amazonaws.com/43602/subtitles.vtt?X-Amz-Algorithm=AWS4-HMAC-SHA256\u0026X-Amz-Credential=AKIAXWNGJW2E2DUNCDBO%2F20241115%2Fus-east-1%2Fs3%2Faws4_request\u0026X-Amz-Date=20241115T043010Z\u0026X-Amz-Expires=86400\u0026X-Amz-SignedHeaders=host\u0026X-Amz-Signature=90348c8b473b8527fc539581d7f58d7d6da4a78e60ee1cb8db49e4958093a3c6"}]