<?xml version="1.0" encoding="utf-8" standalone="yes"?>
<oembed>
  <author_name>sysdev-product2</author_name>
  <author_url>https://blog.hatena.ne.jp/sysdev-product2/</author_url>
  <blog_title>MONEX ENGINEER BLOG │マネックス エンジニアブログ</blog_title>
  <blog_url>https://blog.tech-monex.com/</blog_url>
  <categories>
  </categories>
  <description>The fundamental goal of reinforcement learning is to train an agent to make sequential decisions that maximize its cumulative reward over time. This involves the agent learning an optimal policy that maps a given state to an action to achieve the highest possible return. Mathematically, this process…</description>
  <height>190</height>
  <html>&lt;iframe src=&quot;https://hatenablog-parts.com/embed?url=https%3A%2F%2Fblog.tech-monex.com%2Fentry%2F2025%2F11%2F04%2F144404&quot; title=&quot;The Fundamentals of Reinforcement Learning - MONEX ENGINEER BLOG │マネックス エンジニアブログ&quot; class=&quot;embed-card embed-blogcard&quot; scrolling=&quot;no&quot; frameborder=&quot;0&quot; style=&quot;display: block; width: 100%; height: 190px; max-width: 500px; margin: 10px 0px;&quot;&gt;&lt;/iframe&gt;</html>
  <image_url></image_url>
  <provider_name>Hatena Blog</provider_name>
  <provider_url>https://hatena.blog</provider_url>
  <published>2025-11-04 14:44:04</published>
  <title>The Fundamentals of Reinforcement Learning</title>
  <type>rich</type>
  <url>https://blog.tech-monex.com/entry/2025/11/04/144404</url>
  <version>1.0</version>
  <width>100%</width>
</oembed>
