% Lectures 1-5.tex
% Preamble and title-page metadata for the book build.
\documentclass[12pt]{book}

% --- Packages -------------------------------------------------------------
% NOTE(review): `ae` is listed as obsolete (l2tabu); lmodern with T1 fontenc
% is the usual replacement. Left untouched here so the fonts do not change.
\usepackage{graphicx,ae}
\usepackage{color}      % provides \textcolor, used in the notice under the date
\usepackage{amsmath}
\usepackage{amssymb}
\usepackage{fullpage}
\usepackage{natbib}
\usepackage{framed}

% \ymignore{...} discards its argument (the replacement text is empty).
\newcommand{\ymignore}[1]{}

% hyperref is loaded after the packages above and before the project macros.
\usepackage{hyperref}

% Project-wide macro definitions (defs.tex, not part of this file).
\input{defs}
% Make \SM{...} discard its argument in this build.
% \renewcommand requires \SM to exist already -- presumably defined in defs.tex.
\renewcommand{\SM}[1]{}

% --- Title page -----------------------------------------------------------
\title{Reinforcement Learning: Foundations}
% The \date field also carries the red work-in-progress notice on a second line.
% The contact address is an e-mail, so it is linked with an explicit mailto:
% target; \url alone would link the bare address without a mailto: scheme.
% \nolinkurl keeps the same URL-style typesetting for the visible text.
\date{February 2023
\\
\textcolor{red}{This book is still work in progress. In particular, references to literature are not complete. We would be grateful for comments, suggestions, omissions, and errors of any kind, at \href{mailto:rlfoundationsbook@gmail.com}{\nolinkurl{rlfoundationsbook@gmail.com}}. }
}
\author{Shie Mannor, Yishay Mansour and Aviv Tamar}
% ---------------------------------------------------------------------------
% Document body: title page, table of contents, five chapters, bibliography.
% Each chapter is a heading with its label on the same line, followed by the
% chapter text pulled in from current_chapters/.
% ---------------------------------------------------------------------------
\begin{document}
\maketitle
\tableofcontents
%
% -- Dynamic Programming
% NOTE(review): the included file is named appendix-dp although it is used as
% a regular chapter here -- confirm this is intended.
\chapter{Dynamic Programming}\label{chapter:dp}
\input{current_chapters/appendix-dp}
%
% -- Deterministic Decision Processes
\chapter{Deterministic Decision Processes}\label{chapter:DDP}
\input{current_chapters/chapter2-ddp}
%
% -- Markov Chains
\chapter{Markov Chains}\label{chapter:MC}
\input{current_chapters/chapter3-mc}
%
% -- Finite-horizon MDPs
\chapter{Markov Decision Processes and Finite Horizon Dynamic Programming}\label{chapter:MDP-FH}
\input{current_chapters/chapter4-mdp-fh}
%
% -- Discounted MDPs
\chapter{Discounted Markov Decision Processes}\label{chapter:disc}
\input{current_chapters/chapter5-disc}
%
% -- Bibliography (entries come from bib-lecture.bib)
% NOTE(review): natbib is loaded in the preamble, but `plain` is not one of the
% natbib-aware styles (plainnat/abbrvnat/unsrtnat) -- confirm which is intended.
\bibliographystyle{plain}
\bibliography{bib-lecture}
\end{document}