#EXTM3U #EXT-SL-VERSION:1 #EXT-SL-ACCOUNT-ID:37001 #EXT-SL-PRESENTATION-ID:38941292 #EXT-SL-PRESENTATION-TITLE:Maximum Reward Formulation In Reinforcement Learning #EXT-SL-PRESENTATION-UPDATED-AT:2023-10-20T13:45:23Z #EXT-SL-PLAYER-TYPE:video_slideshow #EXT-SL-PRESENTATION-THUMBNAIL:https://ma.slideslive.com/library/presentations/38941292/thumbnail/maximum-reward-formulation-in-reinforcement-learning_sUcGR1_big.jpg #EXT-SL-SLIDESLIVE-LOGO-VISIBLE:false #EXT-SL-SLIDESLIVE-LOGO-LINKIFY:false #EXT-SL-CUSTOM-CMCD-TRACKING:false #EXT-SL-PLAYLIST-TYPE:vod #EXT-SL-PRESENTATION-MEDIA-SET-ID:84061 #EXT-SL-VOD-VIDEO-SERVICE-NAME:yoda #EXT-SL-VOD-VIDEO-ID:ruBkJItzZ1XN #EXT-SL-VOD-VIDEO-KEN-ENABLED:true #EXT-SL-VOD-VIDEO-SERVERS:["sl-yoda-v3-stream-015-alpha.b-cdn.net","1963568160.rsc.cdn77.org","1940033649.rsc.cdn77.org","sl-yoda-v3-stream-015-beta.b-cdn.net"] #EXT-SL-VOD-SLIDES-XML-URL:https://s.slideslive.com/38941292/v2/38941292.xml?1642088694 #EXT-SL-VOD-SLIDES-JSON-URL:https://s.slideslive.com/38941292/v2/slides.json?1642088694 #EXT-SL-VOD-SUBTITLES:[{"name":"English","language":"en","subtitles_id":43588,"webvtt_url":"https://slideslive-video-subtitles.s3.amazonaws.com/43588/subtitles.vtt?X-Amz-Algorithm=AWS4-HMAC-SHA256\u0026X-Amz-Credential=AKIAXWNGJW2E2DUNCDBO%2F20241115%2Fus-east-1%2Fs3%2Faws4_request\u0026X-Amz-Date=20241115T041607Z\u0026X-Amz-Expires=86400\u0026X-Amz-SignedHeaders=host\u0026X-Amz-Signature=72c30c48acd3d96f2c47491c2dc44f1d5abbf5b78dd8629a53d835a917bb47b8"}]