% aixi.sty
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% AIXI-related formatting rules
%
% written by Jan Leike 2014
%
\usepackage{amsmath}
%---------------------------%
% Argmax and Argmin
% \DeclareMathOperator* is the starred amsmath declaration: sub- and
% superscripts of the new operator are set as limits, like those of \max.
% The thin space \, separates "arg" from "max"/"min" in the printed name.
\DeclareMathOperator*{\argmax}{arg\,max} % argmax operator
\DeclareMathOperator*{\argmin}{arg\,min} % argmin operator
%---------------------------%
% Actions, percepts, observations, and histories
% \A and \E are the calligraphic symbols for the action and percept sets.
\def\A{\mathcal{A}} % set of actions
\def\E{\mathcal{E}} % set of percepts
% \H is the set of histories, i.e. finite sequences over \A x \E, in math mode.
% LaTeX already uses \H for a text accent (the long Hungarian umlaut, as in
% Erd\H{o}s), so the accent is saved and kept available in text mode, in the
% same way this file treats \ae.  The command is declared robust so that the
% mode test is not evaluated early (moving arguments, start of an alignment
% cell).
\let\aixiHaccent\H % original text accent, kept under a private name
\DeclareRobustCommand*{\H}{%
  \ifmmode
    (\A \times \E)^*%
  \else
    \expandafter\aixiHaccent % close the conditional before the accent reads its argument
  \fi
} % history
\let\aechar\ae % change the name of \ae so we can redefine it
% \ae is the action-percept tuple symbol in math mode and the ordinary text
% letter everywhere else.
%   math mode: the original glyph, slanted, inside an \mbox; \scriptsize is
%              used for both script and scriptscript style.
%   text mode: the original \ae, unchanged.
% Every line end inside the definition is protected (by % or by ending on a
% control word), so no space token leaks into the output: an unprotected line
% end after the opening brace would print a space before the letter in text.
% The command is declared robust so that \ifmmode is tested when the symbol is
% actually typeset, not while a moving argument is written out or while TeX
% scans the start of an alignment cell.
\DeclareRobustCommand{\ae}{%
  \ifmmode
    \mathchoice
      {\mbox{\textsl{\aechar}}}% display style
      {\mbox{\textsl{\aechar}}}% text style
      {\mbox{\scriptsize\textsl{\aechar}}}% script style
      {\mbox{\scriptsize\textsl{\aechar}}}% scriptscript style
  \else
    \aechar
  \fi
} % action-percept tuple
%---------------------------%
% Measures
% Both macros are plain \def aliases, so they overwrite any earlier definition
% of the same name without warning (for example the \leadsto arrow symbol of
% latexsym/amssymb, if one of those packages was loaded before this file).
\def\dmid{\parallel} % double mid: prints the \parallel relation symbol
\def\leadsto{\rightarrow} % conditional probability: prints a plain right arrow
% Shared building block of \interleaved: sets the pair #3 #4, pulled together
% by 1pt, in an \mbox under a scriptscript-style \overleftrightarrow.
%   #1  text-mode material placed before the inner formula (strut, font size)
%   #2  math style switch at the start of the inner formula (may be empty)
%   #3  first symbol
%   #4  second symbol
\newcommand{\aixiInterleavedBox}[4]{%
  {\scriptscriptstyle\overleftrightarrow{\mbox{#1$#2{#3}\hspace{-1pt}{#4}$}}}%
}
% \interleaved{<first>}{<second>}: the two symbols side by side under a
% two-headed arrow.  Display and text style use the same construction; script
% style uses a smaller strut and \scriptstyle contents; scriptscript style has
% no strut and \scriptscriptstyle contents.
\newcommand{\interleaved}[2]{%
  {\mathchoice
    {\aixiInterleavedBox{\vphantom{\footnotesize I}\normalsize}{}{#1}{#2}}% display
    {\aixiInterleavedBox{\vphantom{\footnotesize I}\normalsize}{}{#1}{#2}}% text
    {\aixiInterleavedBox{\vphantom{\tiny I}}{\scriptstyle}{#1}{#2}}% script
    {\aixiInterleavedBox{}{\scriptscriptstyle}{#1}{#2}}% scriptscript
  }%
} % agent and environment interleaved
%---------------------------%
% Expectimax operator
\usepackage{relsize}
% \expectimax{<subscript>}: a \sum sign and the word "max" printed on top of
% each other (\ooalign overlays its rows), with <subscript> attached.
%   display style: enlarged \sum (\mathlarger, from relsize) carrying the
%                  subscript as a limit, overlaid with a centred "max"
%   text style:    centred \sum overlaid with "max", subscript on the result
%   script and scriptscript style: the text-style construction with the
%                  contents switched to the matching smaller style; these two
%                  branches used to be empty, which made the operator vanish
%                  whenever it appeared inside a sub- or superscript.
% Each $...$ inside \ooalign starts a fresh formula in text style, hence the
% explicit style switches in the two small variants.
\newcommand{\expectimax}[1]{%
  \mathchoice
    {\ooalign{\hss$\max$\hss\cr$\mathlarger{\sum}\limits_{#1}$}}% display
    {\ooalign{\hss$\sum$\hss\cr$\max$}_{#1}}% text
    {\ooalign{\hss$\scriptstyle\sum$\hss\cr$\scriptstyle\max$}_{#1}}% script
    {\ooalign{\hss$\scriptscriptstyle\sum$\hss\cr$\scriptscriptstyle\max$}_{#1}}% scriptscript
}
%---------------------------%
% Deprecated macros (used in old formalism)
% \O is the calligraphic observation set in math mode.  LaTeX already uses \O
% for the text letter O-with-stroke, so that letter is saved and kept
% available in text mode instead of being overwritten.  The command is
% declared robust so that the mode test is not evaluated early (moving
% arguments, start of an alignment cell).
\let\aixiOslash\O % original text letter, kept under a private name
\DeclareRobustCommand*{\O}{%
  \ifmmode
    \mathcal{O}%
  \else
    \expandafter\aixiOslash % close the conditional before the letter is typeset
  \fi
} % set of observations
% The letters a and o pulled 1.4pt together, grouped so they act as one symbol.
\def\ao{{a\hspace{-1.4pt}o}} % action-observation tuple
% NOTE(review): \rightleftarrows is provided by amssymb, which this file does
% not load; the document has to load it before \interleave is used.
\def\interleave{\rightleftarrows}