Skip to content

Commit a65d266

Browse files
committed
V0.9
1 parent 63c4b48 commit a65d266

File tree

17 files changed

+1462
-53
lines changed

17 files changed

+1462
-53
lines changed

doc/doc.aux

Lines changed: 105 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,105 @@
1+
\relax
2+
\providecommand\hyper@newdestlabel[2]{}
3+
\providecommand\HyperFirstAtBeginDocument{\AtBeginDocument}
4+
\HyperFirstAtBeginDocument{\ifx\hyper@anchor\@undefined
5+
\global\let\oldcontentsline\contentsline
6+
\gdef\contentsline#1#2#3#4{\oldcontentsline{#1}{#2}{#3}}
7+
\global\let\oldnewlabel\newlabel
8+
\gdef\newlabel#1#2{\newlabelxx{#1}#2}
9+
\gdef\newlabelxx#1#2#3#4#5#6{\oldnewlabel{#1}{{#2}{#3}}}
10+
\AtEndDocument{\ifx\hyper@anchor\@undefined
11+
\let\contentsline\oldcontentsline
12+
\let\newlabel\oldnewlabel
13+
\fi}
14+
\fi}
15+
\global\let\hyper@last\relax
16+
\gdef\HyperFirstAtBeginDocument#1{#1}
17+
\providecommand\HyField@AuxAddToFields[1]{}
18+
\providecommand\HyField@AuxAddToCoFields[2]{}
19+
\citation{Deisenroth2011c}
20+
\citation{Deisenroth2011b}
21+
\citation{Sutton1998}
22+
\citation{Bagnell2001}
23+
\citation{Deisenroth2011c}
24+
\citation{Deisenroth2011c}
25+
\citation{Deisenroth2011b}
26+
\citation{Deisenroth2010b}
27+
\@writefile{toc}{\contentsline {chapter}{\numberline {1}Introduction}{1}{chapter.1}}
28+
\@writefile{lof}{\addvspace {10\p@ }}
29+
\@writefile{lot}{\addvspace {10\p@ }}
30+
\@writefile{toc}{\contentsline {section}{\numberline {1.1}Intended Use}{1}{section.1.1}}
31+
\citation{Rasmussen2006}
32+
\citation{Snelson2006}
33+
\citation{Quinonero-Candela2003a}
34+
\citation{Deisenroth2011c}
35+
\@writefile{lof}{\contentsline {figure}{\numberline {1.1}{\ignorespaces Main modules: After an initialization, the first module is responsible for training a GP from available data. The second module is used for policy learning, which consists of policy evaluation and improvement. The third module is responsible for applying the learned policy to the system, which can be either a simulated system or a real system, such as a robot. The collected data from this application is used for updating the model, and the cycle starts from the beginning.}}{2}{figure.1.1}}
36+
\newlabel{fig:modules}{{1.1}{2}{Main modules: After an initialization, the first module is responsible for training a GP from available data. The second module is used for policy learning, which consists of policy evaluation and improvement. The third module is responsible for applying the learned policy to the system, which can be either a simulated system or a real system, such as a robot. The collected data from this application is used for updating the model, and the cycle starts from the beginning}{figure.1.1}{}}
37+
\@writefile{toc}{\contentsline {section}{\numberline {1.2}Software Design and Implementation}{2}{section.1.2}}
38+
\@writefile{toc}{\contentsline {subsection}{\numberline {1.2.1}Model Learning}{2}{subsection.1.2.1}}
39+
\@writefile{toc}{\contentsline {subsection}{\numberline {1.2.2}Policy Learning}{2}{subsection.1.2.2}}
40+
\citation{Deisenroth2011b}
41+
\@writefile{toc}{\contentsline {subsection}{\numberline {1.2.3}Policy Application}{3}{subsection.1.2.3}}
42+
\@writefile{toc}{\contentsline {section}{\numberline {1.3}User Interface by Example}{4}{section.1.3}}
43+
\@writefile{toc}{\contentsline {section}{\numberline {1.4}Quick Start}{4}{section.1.4}}
44+
\citation{Deisenroth2011c}
45+
\@writefile{toc}{\contentsline {chapter}{\numberline {2}Software Package Overview}{5}{chapter.2}}
46+
\@writefile{lof}{\addvspace {10\p@ }}
47+
\@writefile{lot}{\addvspace {10\p@ }}
48+
\@writefile{toc}{\contentsline {section}{\numberline {2.1}Main Modules}{5}{section.2.1}}
49+
\@writefile{toc}{\contentsline {subsection}{\numberline {2.1.1}\texttt {applyController}}{6}{subsection.2.1.1}}
50+
\@writefile{toc}{\contentsline {subsection}{\numberline {2.1.2}\texttt {trainDynModel}}{7}{subsection.2.1.2}}
51+
\@writefile{toc}{\contentsline {subsection}{\numberline {2.1.3}\texttt {learnPolicy}}{7}{subsection.2.1.3}}
52+
\@writefile{lof}{\contentsline {figure}{\numberline {2.1}{\ignorespaces Functions being called from \texttt {learnPolicy.m} for learning the policy.}}{8}{figure.2.1}}
53+
\newlabel{fig:learnP}{{2.1}{8}{Functions being called from \texttt {learnPolicy.m} for learning the policy}{figure.2.1}{}}
54+
\@writefile{toc}{\contentsline {section}{\numberline {2.2}Working with a Real Robot}{8}{section.2.2}}
55+
\citation{Deisenroth2011b}
56+
\citation{Deisenroth2011c}
57+
\citation{Snelson2006}
58+
\@writefile{toc}{\contentsline {chapter}{\numberline {3}Important Function Interfaces}{10}{chapter.3}}
59+
\@writefile{lof}{\addvspace {10\p@ }}
60+
\@writefile{lot}{\addvspace {10\p@ }}
61+
\@writefile{toc}{\contentsline {section}{\numberline {3.1}GP Predictions}{10}{section.3.1}}
62+
\@writefile{lot}{\contentsline {table}{\numberline {3.1}{\ignorespaces Overview of functions for GP predictions with Gaussian distributed test inputs.}}{10}{table.3.1}}
63+
\newlabel{tab:gpP overview}{{3.1}{10}{Overview of functions for GP predictions with Gaussian distributed test inputs}{table.3.1}{}}
64+
\@writefile{toc}{\contentsline {subsection}{\numberline {3.1.1}Input Arguments}{11}{subsection.3.1.1}}
65+
\@writefile{toc}{\contentsline {subsection}{\numberline {3.1.2}Output Arguments}{11}{subsection.3.1.2}}
66+
\@writefile{toc}{\contentsline {section}{\numberline {3.2}Controller}{12}{section.3.2}}
67+
\@writefile{toc}{\contentsline {subsection}{\numberline {3.2.1}Interface}{12}{subsection.3.2.1}}
68+
\@writefile{toc}{\contentsline {subsubsection}{\numberline {3.2.1.1}Input Arguments}{12}{subsubsection.3.2.1.1}}
69+
\@writefile{toc}{\contentsline {subsubsection}{\numberline {3.2.1.2}Output Arguments}{13}{subsubsection.3.2.1.2}}
70+
\@writefile{toc}{\contentsline {section}{\numberline {3.3}Cost Functions}{13}{section.3.3}}
71+
\@writefile{toc}{\contentsline {subsection}{\numberline {3.3.1}Interface for Scenario-specific Cost Functions}{13}{subsection.3.3.1}}
72+
\@writefile{toc}{\contentsline {paragraph}{Input Arguments}{14}{section*.2}}
73+
\newlabel{eq:UCB cost}{{3.1}{14}{Input Arguments}{equation.3.3.1}{}}
74+
\@writefile{toc}{\contentsline {paragraph}{Output Arguments}{14}{section*.3}}
75+
\@writefile{toc}{\contentsline {subsection}{\numberline {3.3.2}General Building Blocks}{14}{subsection.3.3.2}}
76+
\@writefile{toc}{\contentsline {subsubsection}{\numberline {3.3.2.1}Saturating Cost}{14}{subsubsection.3.3.2.1}}
77+
\@writefile{lol}{\contentsline {lstlisting}{lossSat}{14}{lstlisting.3.-8}}
78+
\citation{Deisenroth2010b}
79+
\citation{Deisenroth2010b}
80+
\@writefile{toc}{\contentsline {subsubsection}{\numberline {3.3.2.2}Quadratic Cost}{16}{subsubsection.3.3.2.2}}
81+
\@writefile{lol}{\contentsline {lstlisting}{lossQuad}{16}{lstlisting.3.-14}}
82+
\@writefile{toc}{\contentsline {paragraph}{Input arguments}{16}{section*.5}}
83+
\citation{Deisenroth2010b}
84+
\citation{Deisenroth2010b}
85+
\@writefile{toc}{\contentsline {chapter}{\numberline {4}How to Create Your Own Scenario}{19}{chapter.4}}
86+
\@writefile{lof}{\addvspace {10\p@ }}
87+
\@writefile{lot}{\addvspace {10\p@ }}
88+
\@writefile{toc}{\contentsline {section}{\numberline {4.1}Necessary Files}{19}{section.4.1}}
89+
\@writefile{toc}{\contentsline {section}{\numberline {4.2}ODE Dynamics}{19}{section.4.2}}
90+
\@writefile{lol}{\contentsline {lstlisting}{dynamics\textunderscore cp}{19}{lstlisting.4.-19}}
91+
\citation{Deisenroth2010b}
92+
\@writefile{toc}{\contentsline {section}{\numberline {4.3}Scenario-specific Settings}{20}{section.4.3}}
93+
\@writefile{toc}{\contentsline {subsection}{\numberline {4.3.1}Adding Paths}{20}{subsection.4.3.1}}
94+
\@writefile{lol}{\contentsline {lstlisting}{settings\textunderscore cp}{20}{lstlisting.4.-22}}
95+
\@writefile{toc}{\contentsline {subsection}{\numberline {4.3.2}Indices}{21}{subsection.4.3.2}}
96+
\newlabel{eq:aux state}{{4.1}{22}{Indices}{equation.4.3.1}{}}
97+
\@writefile{toc}{\contentsline {subsection}{\numberline {4.3.3}General Settings}{22}{subsection.4.3.3}}
98+
\@writefile{lof}{\contentsline {figure}{\numberline {4.1}{\ignorespaces Preliminary policy $\mathaccentV {tilde}07E\pi $ and squashed policy $\pi $. The squashing function ensures that the control signals $\boldsymbol {u} = \pi (\boldsymbol {x})$ do not exceed the values $\pm \boldsymbol {u}_{\qopname \relax m{max}}$.}}{23}{figure.4.1}}
99+
\newlabel{eq:squashed rbf policy}{{4.3}{23}{General Settings}{equation.4.3.3}{}}
100+
\newlabel{eq:unsquashed rbf policy}{{4.4}{23}{General Settings}{equation.4.3.4}{}}
101+
\@writefile{toc}{\contentsline {subsection}{\numberline {4.3.4}Plant Structure}{23}{subsection.4.3.4}}
102+
\citation{Deisenroth2011c}
103+
\@writefile{toc}{\contentsline {subsection}{\numberline {4.3.5}Policy Structure}{24}{subsection.4.3.5}}
104+
\@writefile{lof}{\contentsline {figure}{\numberline {4.2}{\ignorespaces Squashing function.}}{25}{figure.4.2}}
105+
\@writefile{toc}{\contentsline {subsection}{\numberline {4.3.6}Cost Function Structure}{25}{subsection.4.3.6}}

0 commit comments

Comments
 (0)