#EXTM3U #EXT-SL-VERSION:1 #EXT-SL-ACCOUNT-ID:37001 #EXT-SL-PRESENTATION-ID:38941569 #EXT-SL-PRESENTATION-TITLE:DEEPAVERAGES: Offline Reinforcement Learn-Ing by Solving Derived Non-Parametric MDPs #EXT-SL-PRESENTATION-UPDATED-AT:2023-10-20T13:47:31Z #EXT-SL-PLAYER-TYPE:video_slideshow #EXT-SL-PRESENTATION-THUMBNAIL:https://ma.slideslive.com/library/presentations/38941569/thumbnail/deepaverages-offline-reinforcement-learning-by-solving-derived-nonparametric-mdps_oJqrIv_big.jpg #EXT-SL-SLIDESLIVE-LOGO-VISIBLE:false #EXT-SL-SLIDESLIVE-LOGO-LINKIFY:false #EXT-SL-CUSTOM-CMCD-TRACKING:false #EXT-SL-PLAYLIST-TYPE:vod #EXT-SL-PRESENTATION-MEDIA-SET-ID:97411 #EXT-SL-VOD-VIDEO-SERVICE-NAME:yoda #EXT-SL-VOD-VIDEO-ID:hubRHBMmUt6U #EXT-SL-VOD-VIDEO-KEN-ENABLED:true #EXT-SL-VOD-VIDEO-SERVERS:["sl-yoda-v3-stream-014-alpha.b-cdn.net","1978117156.rsc.cdn77.org","1243944885.rsc.cdn77.org","sl-yoda-v3-stream-014-beta.b-cdn.net"] #EXT-SL-VOD-SLIDES-XML-URL:https://s.slideslive.com/38941569/v3/38941569.xml?1642091706 #EXT-SL-VOD-SLIDES-JSON-URL:https://s.slideslive.com/38941569/v3/slides.json?1642091706 #EXT-SL-VOD-SUBTITLES:[{"name":"English","language":"en","subtitles_id":43834,"webvtt_url":"https://slideslive-video-subtitles.s3.amazonaws.com/43834/subtitles.vtt?X-Amz-Algorithm=AWS4-HMAC-SHA256\u0026X-Amz-Credential=AKIAXWNGJW2E2DUNCDBO%2F20241115%2Fus-east-1%2Fs3%2Faws4_request\u0026X-Amz-Date=20241115T032818Z\u0026X-Amz-Expires=86400\u0026X-Amz-SignedHeaders=host\u0026X-Amz-Signature=682eb81d227bcc04108367de6afff325230cbe632808d322a1f7abfe3ca21295"}]