<?xml version="1.0" encoding="utf-8" standalone="yes" ?>
<rss version="2.0" 
  xmlns:content="http://purl.org/rss/1.0/modules/content/" 
  xmlns:dc="http://purl.org/dc/elements/1.1/" 
  xmlns:atom="http://www.w3.org/2005/Atom" 
  xmlns:sy="http://purl.org/rss/1.0/modules/syndication/" 
  xmlns:media="http://search.yahoo.com/mrss/">
  <channel>
    <!-- Channel metadata for the tag feed -->
    <title>模倣学習 on 行李の底に収めたり[YuWd]</title>
    <link>https://yuiga.dev/blog/en/tags/%E6%A8%A1%E5%80%A3%E5%AD%A6%E7%BF%92/</link>
    <description>Recent content in 模倣学習 on 行李の底に収めたり[YuWd]</description>
    <generator>Hugo -- gohugo.io</generator>
    <language>en</language>
    <copyright>©2026, All Rights Reserved</copyright>
    <lastBuildDate>Sun, 26 Jun 2022 17:15:40 +0900</lastBuildDate>
    <!-- Self-referencing link: the URL of this feed document itself -->
    <atom:link rel="self"
               type="application/rss+xml"
               href="https://yuiga.dev/blog/en/tags/%E6%A8%A1%E5%80%A3%E5%AD%A6%E7%BF%92/index.xml"/>
    

      
      <!-- Feed entry: "DAgger algorithm" post -->
      <item>
        <title>DAgger algorithm</title>
        <link>https://yuiga.dev/blog/en/ja/posts/dagger_algorithm/</link>
        <pubDate>Sun, 26 Jun 2022 17:15:40 +0900</pubDate>
        <!-- NOTE(review): atom:modified is not an element defined by Atom 1.0 (RFC 4287);
             atom:updated may be what the feed template intends. Confirm before changing. -->
        <atom:modified>Sun, 26 Jun 2022 17:15:40 +0900</atom:modified>
        <!-- guid carries the same permalink as <link> -->
        <guid>https://yuiga.dev/blog/en/ja/posts/dagger_algorithm/</guid>
        <description>状態: $s \in S$ 行動: $a \in A$ 方策: $\pi$ $\pi : S \rightarrow A$ と定義 累積的にデータセットを増やしながら方策を学習していく感じ 誤差が少ないらしい</description>
        <dc:creator>YuWd (Yuiga Wada)</dc:creator>
        <!-- Featured image: the image is hosted externally, so the URL is used as-is
             (absolute) and must not be prefixed with the site base URL. -->
        <media:content url="https://gyazo.com/48b3fd234d5366fec45ccbae2bc3b9b3.png" medium="image">
          <media:title type="html">featured image</media:title>
        </media:content>
        <!-- Categories (tags) attached to the post -->
        <category>模倣学習</category>
        <category>強化学習</category>
        <category>post</category>
      </item>
      

    
  </channel>
</rss>
