-
Notifications
You must be signed in to change notification settings - Fork 6
/
main.tex
35 lines (29 loc) · 865 Bytes
/
main.tex
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
\documentclass{jsarticle}
\usepackage[fleqn]{amsmath}
\usepackage{graphicx}
% ---- Notation macros ------------------------------------------------------
% Operators. Declared with amsmath's \DeclareMathOperator* (instead of
% \mathop{\rm ...}, which relies on the obsolete \rm font switch) so that they
% are set in the upright operator font and, in display style, take their
% subscript underneath, exactly as the previous \mathop definitions did.
\DeclareMathOperator*{\argmin}{argmin}
\DeclareMathOperator*{\argmax}{argmax}

% Calligraphic symbols: \States -> \mathcal{X}, \Actions -> \mathcal{A},
% \MDP -> \mathcal{M}.
\newcommand*{\States}{\mathcal{X}}
\newcommand*{\Actions}{\mathcal{A}}
\newcommand*{\MDP}{\mathcal{M}}

% State, action and reward letters. Each comes as a lowercase/uppercase pair
% (presumably a realized value vs. the corresponding random variable --
% confirm against the text that uses them).
\newcommand*{\st}{x}
\newcommand*{\St}{X}
\newcommand*{\action}{a}
\newcommand*{\Action}{A}
\newcommand*{\reward}{r}
\newcommand*{\Reward}{R}

% "Next" quantities: primed action letters and y/Y for the next state.
\newcommand*{\nextaction}{a'}
\newcommand*{\Nextaction}{A'}
\newcommand*{\nextstate}{y}
\newcommand*{\Nextstate}{Y}
% Title block: the title reads "Szepesvari book: supplementary notes on the
% equations"; the date is left empty so \maketitle prints none.
\title{szepesvari本: 数式補足}
\date{}

\begin{document}
\maketitle

% Unnumbered headings; the "2.4" is written by hand in the section title.
\section*{2.4 Dynamic programming algorithms for solving MDPs}
% Heading below: "Proof of the bound for the policy that is greedy with
% respect to Q^k".
\subsection*{$Q^{k}$に対してグリーディな方策に関するバウンドの証明}
\begin{equation}
  V^\pi(\st) \geq V^*(\st) - \frac{2}{1-\gamma} \, \lVert Q - Q^* \rVert_{\infty}
\end{equation}

\end{document}