Browse Source

Add citations and result table

master
Markus Kaiser 1 year ago
parent
commit
35874e5d75
3 changed files with 66 additions and 17 deletions
  1. +2
    -2
      esann-talk/figures/policy_quiver.tex
  2. +57
    -15
      esann-talk/interpretable_dynamics_models.tex
  3. +7
    -0
      zotero_export.bib

+ 2
- 2
esann-talk/figures/policy_quiver.tex View File

@ -10,8 +10,8 @@
\def\datapath{\figurepath/data}
\begin{axis}[
result plot,
width=.4\plottextwidth,
height=.4\plottextwidth,
width=.45\plottextwidth,
height=.45\plottextwidth,
colormap/RdYlBu,
]

+ 57
- 15
esann-talk/interpretable_dynamics_models.tex View File

@ -17,6 +17,14 @@
\mathtoolsset{showonlyrefs,showmanualtags}
\usepackage{xfrac}
% Table
\usepackage{etoolbox}
\robustify\bfseries
\usepackage{colortbl}
\usepackage{booktabs}
\usepackage{tabularx}
\usepackage{siunitx}
% Theme and Font
\usetheme{metropolis}
\usecolortheme{metropolis-siemens}
@ -54,18 +62,14 @@
\input{figures/preamble/tikz_jumping.tex}
% Bibliography
\usepackage[style=authoryear, backend=biber, url=false]{biblatex}
\addbibresource{../zotero_export.bib}
\title{Interpretable Dynamics Models}
\subtitle{Data-Efficient Reinforcement Learning}
\subtitle{For Data-Efficient Reinforcement Learning}
\date{April 24, 2019}
% \author{%
% Markus Kaiser, \href{mailto:markus.kaiser@siemens.com}{markus.kaiser@siemens.com}
% \texorpdfstring{\\}{, }
% Clemens Otte
% \texorpdfstring{\\}{, }
% Thomas A. Runkler
% \texorpdfstring{\\}{, }
% Carl Henrik Ek
% }
\author{%
Markus Kaiser,
Clemens Otte,
@ -89,7 +93,7 @@
}
\includeonlyframes{policy}
% \includeonlyframes{policy,bibliography}
\begin{document}
@ -110,7 +114,7 @@
\end{frame}
\begin{frame}[label=wetchicken]{Wetchicken Benchmark}
\begin{frame}[label=wetchicken]{Wet-Chicken Benchmark\footcite{tresp_wet_1994,hans_efficient_2009}}
\begin{itemize}
\item High-level ideas about the benchmark
\item Probably can just skip the true dynamics?
@ -139,16 +143,54 @@
\end{frame}
% Frame "Policy": policy quiver plot on the left, result table on the right.
% The table compares NFQ, GP and DAGP for several values of N; cells marked
% with \winner are highlighted (tinted background, bold weight).
\begin{frame}[label=policy]{Policy}
  \centering
  \begin{columns}[T]
    \begin{column}{.45\textwidth}
      \includestandalone{figures/policy_quiver}
    \end{column}
    \begin{column}{.5\textwidth}
      \centering
      % siunitx settings for the S columns: values are "mean \pm uncertainty".
      % detect-weight lets the \bfseries issued by \winner reach the numbers.
      \sisetup{
        table-format=-1.2(2),
        table-number-alignment=center,
        separate-uncertainty,
        % table-align-uncertainty,
        table-figures-uncertainty=1,
        detect-weight,
      }
      % Highlight a table cell: tinted background plus bold weight.
      \newcommand{\winner}{{\cellcolor{mStructure!40}}\bfseries}
      \footnotesize
      \vspace{4ex}
      \begin{tabular}{cSSS}
        \toprule
        {N} & {NFQ\footnotemark} & {GP\footnotemark} & {DAGP} \\
        \midrule
        100 & 0.66 \pm 0.16 & \winner 1.41 \pm 0.01 & 1.18 \pm 0.09 \\
        250 & 1.71 \pm 0.07 & 1.54 \pm 0.01 & \winner 2.33 \pm 0.01 \\
        500 & 1.60 \pm 0.10 & 1.56 \pm 0.01 & \winner 2.25 \pm 0.01 \\
        1000 & 1.99 \pm 0.06 & 2.13 \pm 0.01 & \winner 2.32 \pm 0.01 \\
        2500 & \winner 2.26 \pm 0.02 & 1.91 \pm 0.01 & \winner 2.28 \pm 0.01 \\
        5000 & \winner 2.33 \pm 0.01 & 1.91 \pm 0.01 & 2.28 \pm 0.01 \\
        \bottomrule
      \end{tabular}
    \end{column}
  \end{columns}
  % The two \footnotemark calls in the table header each stepped the footnote
  % counter. Derive the numbers of the matching texts from that counter rather
  % than hard-coding 1 and 2, so marks and texts still agree when an earlier
  % frame has already produced footnotes (e.g. via \footcite).
  \addtocounter{footnote}{-1}
  \footnotetext{\cite{riedmiller_neural_2005}}
  \stepcounter{footnote}
  \footnotetext{\cite{deisenroth_pilco_2011}}
\end{frame}
% Frame "Interpretable Results": two standalone figures, centred on the slide.
\begin{frame}[label=results]
  \frametitle{Interpretable Results}
  \centering
  \includestandalone{figures/falldown_probabilities}
  \includestandalone{figures/hetero_noise}
\end{frame}
\appendix
\begin{frame}[label=policy]{Policy}
\centering
\includestandalone{figures/policy_quiver}
\begin{frame}[label=bibliography, allowframebreaks]
\printbibliography
\end{frame}
\end{document}

+ 7
- 0
zotero_export.bib View File

@ -84,4 +84,11 @@
url = {https://www.tensorflow.org/}
}
% Technical report: typed as a report so the issuing institution and the
% report type are not squeezed into a journal title field.
@report{tresp_wet_1994,
  author = {Tresp, Volker},
  date = {1994},
  institution = {Siemens AG, CT IC 4},
  title = {The Wet Game of Chicken},
  type = {techreport}
}

Loading…
Cancel
Save