% 046203_lectures_2023/Lectures 1-5.tex

% Master file: 12pt book layout.
\documentclass[12pt]{book}

% --- Graphics and fonts ---
\usepackage{graphicx}
% T1 encoding with Latin Modern replaces the obsolete `ae` package
% (listed as obsolete in l2tabu; lmodern + T1 is the recommended substitute).
\usepackage[T1]{fontenc}
\usepackage{lmodern}
\usepackage{color}

% --- Math ---
\usepackage{amsmath}
\usepackage{amssymb}

% --- Page layout, citations, framed boxes ---
\usepackage{fullpage}
\usepackage{natbib}
\usepackage{framed}

% \ymignore{...} discards its argument, so the wrapped text is not typeset.
\newcommand{\ymignore}[1]{}

% hyperref is loaded after the other packages so that it can patch them.
\usepackage{hyperref}

% Shared macro definitions live in defs.tex.
\input{defs}
% Override \SM so that it discards its argument. \renewcommand requires \SM
% to exist already -- presumably it is defined in defs.tex; verify if this errors.
\renewcommand{\SM}[1]{}

% Title-page metadata consumed by \maketitle.
\title{Reinforcement Learning: Foundations}
\author{Shie Mannor, Yishay Mansour and Aviv Tamar}
% The date field also carries the red work-in-progress notice.
% Keep the argument free of blank lines: an empty line becomes \par, which is
% not accepted inside the argument of \date.
\date{%
  February 2023\\
  % The contact address is an e-mail, so it is linked with an explicit mailto:
  % target; \nolinkurl typesets it in URL style without creating a second link.
  \textcolor{red}{This book is still work in progress. In particular, references to literature are not complete. We would be grateful for comments, suggestions, omissions, and errors of any kind, at \href{mailto:rlfoundationsbook@gmail.com}{\nolinkurl{rlfoundationsbook@gmail.com}}. }%
}


\begin{document}

% Title page followed by the table of contents.
\maketitle
\tableofcontents

% Each chapter below is a heading, a label for cross-references, and the
% file under current_chapters/ that holds its text.

% Dynamic programming (the text comes from the file named appendix-dp).
\chapter{Dynamic Programming}\label{chapter:dp}
\input{current_chapters/appendix-dp}

% Deterministic decision processes.
\chapter{Deterministic Decision Processes}\label{chapter:DDP}
\input{current_chapters/chapter2-ddp}

% Markov chains.
\chapter{Markov Chains}\label{chapter:MC}
\input{current_chapters/chapter3-mc}

% Markov decision processes, finite horizon.
\chapter{Markov Decision Processes and Finite Horizon Dynamic Programming}\label{chapter:MDP-FH}
\input{current_chapters/chapter4-mdp-fh}

% Discounted Markov decision processes.
\chapter{Discounted Markov Decision Processes}\label{chapter:disc}
\input{current_chapters/chapter5-disc}

% Bibliography: `plain' style, entries read from bib-lecture.bib.
\bibliographystyle{plain}
\bibliography{bib-lecture}

\end{document}