@InProceedings{gulwani2009,
author = {Sumit Gulwani and Sagar Jain and Eric Koskinen},
booktitle = {Proceedings of the 2009 {ACM} {SIGPLAN} Conference on Programming Language Design and Implementation, {PLDI} 2009, Dublin, Ireland, June 15-21, 2009},
title = {Control-flow refinement and progress invariants for bound analysis},
year = {2009},
editor = {Michael Hind and Amer Diwan},
pages = {375--385},
publisher = {{ACM}},
bibsource = {dblp computer science bibliography, https://dblp.org},
biburl = {https://dblp.org/rec/conf/pldi/GulwaniJK09.bib},
doi = {10.1145/1542476.1542518},
file = {:/home/paradyx/MA/literatur/gulwani2009.pdf:PDF},
groups = {Partial Evaluation},
timestamp = {Fri, 25 Jun 2021 14:48:54 +0200},
url = {https://doi.org/10.1145/1542476.1542518},
}
@InProceedings{gallagher2019eptcs,
author = {John P. Gallagher},
booktitle = {Proceedings Seventh International Workshop on Verification and Program Transformation, VPT@Programming 2019, Genova, Italy, 2nd April 2019},
title = {Polyvariant Program Specialisation with Property-based Abstraction},
year = {2019},
editor = {Alexei Lisitsa and Andrei P. Nemytykh},
pages = {34--48},
series = {{EPTCS}},
volume = {299},
bibsource = {dblp computer science bibliography, https://dblp.org},
biburl = {https://dblp.org/rec/journals/corr/abs-1908-07189.bib},
doi = {10.4204/EPTCS.299.6},
file = {:/home/paradyx/MA/literatur/gallagher2019eptcs.pdf:PDF},
groups = {Partial Evaluation},
timestamp = {Fri, 03 Jun 2022 08:18:12 +0200},
url = {https://doi.org/10.4204/EPTCS.299.6},
}
% TeX root = ../main.tex
\begin{tikzpicture}[program,initial left]
\node[state,initial] (l0) {$l_0$};
\node[state] (l1) [right=3cm of l0] {$l_1$};
\node[state] (l2) [right=3cm of l1] {$l_2$};
\path[->] (l0) edge node {$t_1:\textit{true}$} (l1)
(l1) edge node {$t_3:x \leq 0$} (l2)
edge[loop above] node {$t_2: \begin{aligned}
x &> 0 \\
x &:= x - \textsc{Bern}(0.5)
\end{aligned}$}
()
;
\end{tikzpicture}
% TeX root = ../main.tex
\begin{tikzpicture}[program,initial left]
\node[state,initial] (l0) {$l_0$};
\node[state] (l1) [right=3cm of l0] {$l_1$};
\node[state] (l2) [right=3cm of l1] {$l_2$};
\path[->] (l0) edge node {$t_1:\textit{true}$} (l1)
(l1) edge node {$t_5:x \leq 0$} (l2)
edge[in=100,out=145,looseness=15,draw=rot-75] node[above
left] {$t_2:\begin{aligned} p&=0.5 \\ x &> 0 \\ x&:=
x+1\end{aligned}$} (l1)
edge[in=35,out=80,looseness=15,draw=rot-75] node[above right] {$t_3:\begin{aligned}
p&=0.5 \\x &> 0 \\ x&:=
x+2\end{aligned}$} (l1)
edge[loop below] node {$t_4:\begin{aligned} x &> 0 \\ x&:=
x-1\end{aligned}$} ()
;
\end{tikzpicture}
% TeX root = ../main.tex
\begin{tikzpicture}[program,initial left]
\node[state,initial] (l0) {$l_0$};
\node[state] (l1) [right=3cm of l0] {$l_1$};
\node[state] (l2) [right=3cm of l1] {$l_2$};
\path[->] (l0) edge node {$t_1:\textit{true}$} (l1)
(l1) edge[loop above] node {$t_2: \
\begin{aligned}
x & > 0 \\
1 &\leq t \leq 3 \\
x &:= x - t
\end{aligned}$} ()
(l1) edge node {$t_3:x \leq 0$} (l2)
;
\end{tikzpicture}
% TeX root = ../main.tex
\begin{tikzpicture}[program,initial left]
\node[state,initial] (l0) {$l_0$};
\node[state] (l1) [right=3cm of l0] {$l_1$};
\node[state] (l2) [right=3cm of l1] {$l_2$};
\path[->] (l0) edge node {$t_1:\textit{true}$} (l1)
(l1) edge node {$t_4:x \leq 0$} (l2)
edge[loop above] node {$t_2:\begin{aligned} x &> 1 \\ x&:=
x+1\end{aligned}$} ()
edge[loop below] node {$t_3:\begin{aligned} x &> 0 \\ x&:=
x-1\end{aligned}$} ()
;
\end{tikzpicture}
% TeX root = ../main.tex
\begin{tikzpicture}[scale=0.5]
\begin{axis}[
axis lines = center,
axis on top,
xmin=0,
xmax=6.3,
ymin=0,
ymax=5.3,
y=1cm,
x=1cm,
ytick={0,...,5},
xtick={0,...,6},
xlabel = x,
ylabel = y,
font=\tiny
]
% Polyhedron
\addplot[mark=none,draw=black,fill=rwth-50] coordinates {(1,2) (1,3)
(3,4) (4,4) (5,2) (4,1) (2,1)} -- cycle;
% Constraints
% -x + 2y = 5
\addplot[mark=none,dashed] {(x +5)/2};
% y = 4
\addplot[mark=none,dashed] {4};
% 2x + y = 12
\addplot[mark=none,dashed] {-2*x + 12};
% x - y = 3
\addplot[mark=none,dashed] {x - 3};
% y = 1
\addplot[mark=none,dashed] {1};
% x + y = 3
\addplot[mark=none,dashed] {-x + 3};
% x = 1
\addplot[mark=none,dashed] coordinates {(1, 0) (1,5.3)};
% Points
\addplot[only marks,mark=o] coordinates {
(3,4) (4,4)
(1,3) (2,3) (3,3) (4,3)
(1,2) (2,2) (3,2) (4,2) (5,2)
(2,1) (3,1) (4,1)
};
\end{axis}
\end{tikzpicture}
% TeX root = ../main.tex
\begin{tikzpicture}[scale=0.5]
\begin{axis}[
axis lines = center,
axis on top,
xmin=0,
xmax=6.3,
ymin=0,
ymax=5.3,
y=1cm,
x=1cm,
ytick={0,...,5},
xtick={0,...,6},
xlabel = x,
ylabel = y,
font=\tiny
]
% Octagon
\addplot[mark=none,draw=black,fill=rwth-50] coordinates {(1,2) (1,3)
(2,4) (4,4) (5,3) (3,1) (2,1)} -- cycle;
% Constraints
% x = 1
\addplot[mark=none,dashed] coordinates {(1, 0) (1,5.3)};
% -x + y = 2
\addplot[mark=none,dashed] {x + 2};
% y = 4
\addplot[mark=none,dashed] {4};
% x + y = 8
\addplot[mark=none,dashed] {-x + 8};
% -x + y = -2
\addplot[mark=none,dashed] {x - 2};
% y = 1
\addplot[mark=none,dashed] {1};
% x + y = 3
\addplot[mark=none,dashed] {-x + 3};
% Points
\addplot[only marks,mark=o] coordinates {
(2,4) (3,4) (4,4)
(1,3) (2,3) (3,3) (4,3) (5,3)
(1,2) (2,2) (3,2) (4,2)
(2,1) (3,1)
};
\end{axis}
\end{tikzpicture}
% TeX root = ../main.tex
\begin{tikzpicture}[scale=0.5]
\begin{axis}[
axis lines = center,
axis on top,
xmin=0,
xmax=6.3,
ymin=0,
ymax=5.3,
y=1cm,
x=1cm,
ytick={0,...,5},
xtick={0,...,6},
xlabel = x,
ylabel = y,
font=\tiny
]
% Box
\addplot[mark=none,draw=black,fill=rwth-50] coordinates {(1,2) (1,4) (5,4) (5,2)} -- cycle;
% Intervals
\addplot[mark=none,dashed] coordinates {(1,0) (1,2)};
\addplot[mark=none,dashed] coordinates {(5,0) (5,2)};
\addplot[mark=none,dashed] coordinates {(0,2) (1,2)};
\addplot[mark=none,dashed] coordinates {(0,4) (1,4)};
% Points
\addplot[only marks,mark=o] coordinates {
(1,4) (2,4) (3,4) (4,4) (5,4)
(1,3) (2,3) (3,3) (4,3) (5,3)
(1,2) (2,2) (3,2) (4,2) (5,2)
};
\end{axis}
\end{tikzpicture}
\end{comment}
\section{Modules}
The code specific to this thesis is split into several modules. The code is
fully commented. Nonetheless, this section gives a short overview of the
modules to ease the understanding of the code.
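A minimal OCaml sketch of how such modules could fit together is shown below.
The signatures and names (\texttt{find\_loops}, \texttt{abstract},
\texttt{evaluate}) are purely illustrative and do not reproduce the actual
interfaces of the implementation.
\begin{verbatim}
(* Illustrative module signatures only; the real interfaces differ. *)
module type LOOPS = sig
  type location
  type graph
  (* the loops of a program graph, each given as a list of locations *)
  val find_loops : graph -> location list list
end

module type ABSTRACTION = sig
  type constr        (* a conjunction of constraints *)
  type abstracted    (* the abstracted version of a constraint set *)
  val abstract : constr -> abstracted
end

module type PARTIAL_EVALUATION = sig
  type program
  (* unfold the program and abstract the versions until a fixpoint is reached *)
  val evaluate : program -> program
end
\end{verbatim}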
\subsection{Loops}
\subsection{PartialEvaluation}
\subsection{Abstraction}
\section{Command-Line Interface}
The techniques described above were implemented natively in KoAT2. They are
available as part of the normal analysis via the flag \texttt{--cfr-native}.
The old option for control-flow refinement, \texttt{--cfr}, was renamed to
\texttt{--cfr-ir} and can probably be removed in the future.
During normal analysis the control-flow refinement is done on every \gls{scc}
and the bounds of the resulting \gls{scc} are compared to the previous bounds.
A full program can be refined using the native control-flow refinement with a
separate command \texttt{cfr}. For the new control-flow refinement, options are
added to switch between the various methods to select locations for abstraction
and the abstraction method itself (see \Sref{sec:abstraction}). A summary of
the compatible options is given in \tref{tab:options}.

As discussed in \Sref{sec:updateinvariants}, the polyhedra computed during
evaluation are tighter than the invariants computed during preprocessing. In
order to update the invariants after the partial evaluation, a new option
\texttt{--update-invariants} is added and activated by default.
% \begin{table}
% \center
% \begin{tabular}[ccc]
% \hline
% \begin{comment}
% analysis --cfr=native,update-invariants, --o
% --cfr=irankfinder,
% --cfr=off
% prob-analysis --cfr=native
% cfr --native
% --irankfinder
% \end{comment}
% \hline
% \end{tabular}
% \caption{}
% \end{table}
\begin{comment}
cfr --
The project was compiled with OCaml 4.14.0.
\addConstraint{ x_i }{\leq 1,\protect\quad\label{eq:lip1-leq1}}{i = 1,\dots,n}
\addConstraint{ x_i }{\geq 0,\protect\quad\label{eq:lip1-geq0}}{i = 1,\dots,n}
\addConstraint{ x_i }{\leq 1,\protect\quad\label{eq:ilp-leq1}}{i = 1,\dots,n}
\addConstraint{ x_i }{\geq 0,\protect\quad\label{eq:ilp-geq0}}{i = 1,\dots,n}
\ref{eq:lip1-hit} guarantees that every loop is \enquote{hit}, while
\ref{eq:lip1-leq1} and \ref{eq:lip1-geq0} enforce that every location is only
selected at most once. The optimization goal \ref{eq:lip-vfs} being to select
\ref{eq:ilp-hit} guarantees that every loop is \enquote{hit}, while
\ref{eq:ilp-leq1} and \ref{eq:ilp-geq0} enforce that every location is only
selected at most once. The optimization goal \ref{eq:ilp-vfs} being to select
\begin{comment}
# Text building blocks
---
For random program variables in this thesis, $\Omega$ will be the set of
integers and $\mathcal{F}$ the maximal $\sigma$-field in $\Omega$, the
power-set $2^\Omega$. However since the program variables are chosen at
random, a specific path over a given program can also be considered a random
event in the probability space and hence be considered as a random variable.
In this case $\Omega$ is the set of all runs $\mathcal{Runs}$. The exact
definition will be introduced later on in \Sref{}.
---
\begin{definition}[Linear Constraints]
Let $V$ be a fixed set of integer
variables $\{x_1, x_2, \dots, x_n\} $. A linear constraint is defined as $\psi
= a_0 + a_1 x_1 + \dots + a_n x_n \diamond 0$ where $a_i \in \mathbb{Z}$ are
integer coefficients, $x_i \in V$ are variables and $\diamond \in \{>, <,
\geq, \leq, =\}$. \end{definition}
\begin{definition}[Assignment]
An assignment $\sigma : V \mapsto \mathbb{Z}$ assigns an integer value to
each variable in $V$. $\sigma$ is a solution for a linear constraint $\psi$
if $\psi$ evaluates to true under $\sigma$.
\end{definition}
Common operations can be defined over probability distributions as well, which
will be very handy in probabilistic integer programs. Given two probability
distributions $p$, and $q$, the following operations are defined:
\begin{equation*}
p \diamond q (x) = \sum_{\substack{i,j \in \Z \\ i \diamond j = x}} p(i)
\cdot q(j) \hspace{1cm} \with \diamond \in \{+, \cdot\}
\end{equation*}
\todo{more operators?}
In the context of this thesis the discrete bounded distributions will be used to
describe the possible values of a variable. They can be used as if they were
non-probabilistic values, for example inside the program itself during
assignments when setting a new value to a variable, or during analysis to
describe the possible values of the variables at a certain configuration.
Note that a non-probabilistic (fixed) value $k$ is equivalent to a distribution
which assigns the probability $1$ to this fixed value $k$ and $0$ to every
other value:
\[
p_k(x) = \begin{cases}
1, & x = k \\
0, & \text{otherwise}
\end{cases}
\]
\end{comment}
\begin{comment}
- Term Rewrite Systems (TRS)
- Transition Systems
- A set of States S
- A start location S_0 \in S
- A set of transitions T \in S x C x S
- Integer Transition Systems (ITS)
Koat2 can work on integer programs with polynomial integer
arithmetic.\cite{Brockschmidt16} To represent states and invariants in such a
program, one needs polynomial constraints. As an extended concept Koat2 uses
boxes and we will use polyhedra for the partial evaluation. Since those concepts
are closely related we will introduce them together.
\end{comment}
\newcommand{\confs}[0]{\textbf{\textsf{Conf}}}
\newcommand{\runs}[0]{\textbf{\textsf{Runs}}}
\newcommand{\fpath}[0]{\textbf{\textsf{FPath}}}
\section{Preliminaries}\label{sec:preliminaries}
\subsection{Constraints}\label{ssec:constraints}
In the following $\V$ denotes a finite set of variables $\V = \{v_1,
\dots, v_n\}$.
\begin{definition}[Constraints]\label{def:constraints}
	A \textit{constraint} over the variables $\V$ is an inequation of the form
	$p > 0$ or $p \geq 0$ for a polynomial $p \in \Z[\V]$. A \textit{linear}
	constraint is a constraint whose polynomial $p$ has degree at most one.
	$\L$ denotes the set of all constraints.
\end{definition}
\begin{definition}[Satisfiability]\label{def:satisfiability}
	For a domain $A$ and a structure $\mathfrak{A} = (A, +, \cdot, 0, 1, \leq,
	<, =)$, a constraint $\psi \in \L$ is \textit{satisfiable} when
	$\mathfrak{A} \models \psi$. We say a (total) variable assignment $\beta: \V
	\rightarrow A$ \textit{satisfies} the constraint $\psi$ when
	$(\mathfrak{A}, \beta) \models \psi$.
\end{definition}
Note that the constraints are restricted to (strict) inequality against zero. In
practice constraints are often provided in a more general form. Restricting the
constraints to this specific form does not limit their practicality, since they
can easily be rewritten into it. When talking about integer arithmetic we will
thus only refer to linear constraints.
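For example, a general linear constraint, and over the integers even a strict
one, can always be normalised against zero:
\begin{equation*}
	x + 2y \leq 5 \iff 5 - x - 2y \geq 0, \qquad x < y \iff y - x - 1 \geq 0 .
\end{equation*}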
The problem of determining if a set of constraints is satisfiable, or finding
valid variable assignments for a given formula, is part of \gls{smt} and is well
researched. The theories relevant for this thesis are quantifier-free linear
integer arithmetic (usually called \texttt{QF\_LIA}) and quantifier-free
polynomial integer arithmetic (\texttt{QF\_PIA}).
Sometimes one is not interested in the values of all variables but only of a
subset of variables. This will later become relevant when handling temporary
variables that are only relevant within the scope of a transition. In FO-logic
one would just existentially quantify the variable. However, the new FO-formula
would not be quantifier-free anymore. Instead, a new formula is searched for
that has exactly the same solutions when ignoring the values of the irrelevant
variables.
Let $X \subseteq V$ and $\varphi$ be a quantifier-free FO-formula over the
variables $V$, and let $\beta|_X$ denote the restriction of the assignment
$\beta$ to the smaller domain $X$.
The \textit{projection} of $\varphi$ onto $X$ is a quantifier-free FO-formula
$\varphi'$ over the variables $X$, with $\llbracket \varphi' \rrbracket =
\set{\beta|_X}{\beta \in \llbracket \varphi \rrbracket}$.
Geometrically, the projection can be seen as the set of solutions projected
(casting a shadow) onto the remaining dimensions.
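For example, projecting the formula $\varphi = (x \geq 0 \land y \geq x)$ onto
$X = \{y\}$ yields $\varphi' = (y \geq 0)$, since exactly the assignments with
$y \geq 0$ can be extended by a value for $x$ such that $\varphi$ holds.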
\section{Abstract Domains}\label{sec:abstract_domains}
Another way of reasoning about solutions is to see them as points in an
$m$-dimensional space for variables $X \subset \V$ with $|X| = m$. Every
constraint partitions the space into one included and one excluded part. In case
of integer arithmetic the solutions are discrete points in this space.
An abstract domain is a representation of such sets of points. Usually they
over-approximate the sets in order to facilitate operations. Commonly used
abstract domains are Polyhedra\cite{bagnara2005convexpolyhedron},
Octagons\cite{mine2001wcre, mine2007arxiv, mine2006hosc,truchet2010synacs}, and
the Interval domain\cite{}.
\subsection{Operations}\label{ssec:ad_operations}
All abstract domains support the following operations with varying computational
and memory requirements: emptiness, intersection, inclusion test, orthogonal
projection, upper, and lower bounds. There are many more but we will focus only
on the ones important for this thesis. They all
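To make this interface concrete, the following OCaml signature sketches the
operations listed above; it is purely illustrative and does not reproduce the
interfaces used in the actual implementation.
\begin{verbatim}
(* Illustrative signature for the abstract-domain operations listed above. *)
module type ABSTRACT_DOMAIN = sig
  type t                                    (* an abstract value *)
  val is_empty  : t -> bool                 (* emptiness, i.e. unsatisfiability *)
  val meet      : t -> t -> t               (* intersection of two abstract values *)
  val is_subset : t -> t -> bool            (* inclusion test *)
  val project   : t -> keep:int list -> t   (* orthogonal projection onto dimensions *)
  (* lower and upper bound of one dimension, None when unbounded *)
  val bounds    : t -> int -> int option * int option
end
\end{verbatim}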
The test for emptiness is equivalent to asking if a formula is satisfiable, as
every point represents a solution to the formula. Intersecting two or more
abstract values is equivalent to the conjunction of the corresponding formulas.
However, the intersection of two abstract values might include more values than
the solutions of the formula conjunction, due to the approximative nature of
abstract domains.
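For instance, in the interval domain the two constraint sets
$\{x = y,\ 0 \leq x \leq 2\}$ and $\{x = 2 - y,\ 0 \leq x \leq 2\}$ are both
abstracted by the box $[0,2] \times [0,2]$, so the intersection of the two
abstract values is again $[0,2] \times [0,2]$, whereas the conjunction of the
two formulas only has the single solution $x = y = 1$.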
\begin{example}\label{ex:intersection}
\begin{figure}[h]
\centering
\begin{subcaptionblock}[t]{0.3\textwidth}
\input{figures/ch1_example1_phi1}
\caption{Formula $\varphi_1$}
\end{subcaptionblock}
\begin{subcaptionblock}[t]{0.3\textwidth}
\input{figures/ch1_example1_phi2}
\caption{Formula $\varphi_2$}
\end{subcaptionblock}
\begin{subcaptionblock}[t]{0.3\textwidth}
\input{figures/ch1_example1_phi3}
\caption{Formula $\varphi_3 = \varphi_1 \land \varphi_2$}
\end{subcaptionblock}
\caption{Graphical representation of the set of constraints $\varphi_1$,
$\varphi_2$ and $\varphi_3$ from Example \ref{ex:intersection}. Every constraint is
represented by a line and the excluded side is marked by
hatchings.\label{fig:ex_intersection} }
\end{figure}
Consider the following constraints over the variables $\V = \{x, y\}$:
\begin{align}
\varphi_1 &= 2y \leq x \\
\varphi_2 &= 2y > x^2 - 4
\end{align}
They are graphically represented in \fref{fig:ex_intersection} using a
2D-coordinate system. Since the space is two-dimensional the linear
constraint $\varphi_1$ can be represented as a straight line and $\varphi_2$
as a parabola.
The solutions are marked as circles. For example, the assignment $\sigma: x
\mapsto 0, y \mapsto -2$ (colored red) satisfies $\varphi_1$ but not
$\varphi_2$. The conjunction $\varphi_3 = \varphi_1 \land \varphi_2$ is
clearly equal to the intersection of both sets of solutions. While
$\varphi_1$ and $\varphi_2$ have infinitely many solutions, the conjunction
$\varphi_3$ has only finitely many.
\end{example}
The orthogonal projection computes the projection of an FO-formula onto a
subset of the variables, possibly losing some precision in the process.
In the following we will give a short introduction to the abstract domains. A
visual example for the three abstract domains is given in
\fref{fig:abstract_domains}.
\begin{figure}
\centering
\begin{subcaptionblock}[t]{0.3\textwidth}
\input{figures/ch2_abstract_domains_box}
\caption{Interval domain (Box)\label{fig:abstract_domains_box}}
\end{subcaptionblock}
\begin{subcaptionblock}[t]{0.3\textwidth}
\input{figures/ch2_abstract_domains_oct}
\caption{Octagon domain\label{fig:abstract_domains_oct}}
\end{subcaptionblock}
\begin{subcaptionblock}[t]{0.3\textwidth}
\input{figures/ch2_abstract_domains_poly}
\caption{Polyhedra domain\label{fig:abstract_domains_poly}}
\end{subcaptionblock}
\caption{Visual comparison of the Interval domain, Octagons and
Polyhedra\label{fig:abstract_domains}}
\end{figure}
\subsection{Not necessarily closed convex polyhedra}\label{ssec:polyhedra}
As discussed in \Sref{ssec:constraints}, strictness of linear constraints and in
turn openness of half-spaces are not relevant to the integer domain. Hence, when
talking about integer arithmetic, one can restrict oneself to closed polyhedra.
\todo{more about tightness of operations}
\todo{say something about
overapproximation of polynomial constraints}
\begin{definition}\label{def:octagons}
	$\mathcal{P} \subseteq \R^n$ is an octagon if and only if it can be
	expressed by a set of constraints of the form $\pm v_i \pm
	v_j \leq b$\cite{mine2001wcre}.
\end{definition}
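For example, the constraint set
\begin{equation*}
	\{\, x + y \leq 8,\ x - y \leq 2,\ -x + y \leq 2,\ -x - y \leq -3 \,\}
\end{equation*}
describes an octagon over the variables $x$ and $y$, whereas a constraint such
as $2x + y \leq 12$ already leaves the octagon domain and requires a general
polyhedron.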
Obviously, such constraints are linear constraints and hence octagons are a
specialization of polyhedra. Octagons are used in \gls{koat} during the
computation of invariants. They are faster to work with than polyhedra but less
precise. \todo{cite runtime for various operations} As shown in
\Sref{sec:invariant}, too wide constraints are not a problem for invariants.
A box is described by constraints of the form $\pm v_i \leq b$, that is, by an
interval for every variable. By construction every box is an octagon and in
turn a polyhedron. For every polyhedron $P$ one can find a box $P'$ that
contains the polyhedron $P$.\todo{citation or proof}
Whenever it is acceptable to arbitrarily widen the polyhedron, one can work
with boxes instead. Boxes are computationally very efficient, although rather
imprecise, for most applications.
Imagine a probabilistic event with a set of possible outcomes $\Omega$. For
example, a coin-toss can have arbitrarily many outcomes when taking the position
on the table into account, the fact that the coin might get lost in the process,
etc.
A probability measure describes the probabilities of sets of random outcomes.
For example, the coin-toss on the table has a subset of outcomes where the coin
shows heads. The probability measure would assign a probability close to 50\%
to this subset for a somewhat normal coin-toss.
Formally, a probability measure is defined on a $\sigma$-algebra, which asserts
an intuitive property of random events: if two subsets of outcomes are
measurable (e.g. $A = \set{ \omega \in \Omega} {\text{coin shows head}}$ and $B
= \set{\omega \in \Omega} {\text{coin shows tail}}$), then so is their union
($A \union B = \set{\omega \in \Omega} {\text{coin shows heads or tails}}$),
and for disjoint subsets the probability of the combined outcomes is equal to
the sum of the probabilities of the individual outcomes.
\begin{definition}[Probability Measure]\label{def:measure}
A set function $\mu$ on a $\sigma$-field $\F$ is a probability
measure if it satisfies the following conditions:
\begin{enumerate}
\item $\mu(A)\in [0,1]$ for $A \in \F$
\item $\mu(\emptyset) = 0$
\item if $A_1, A_2, \dots$ is a disjoint sequence of $\F$-sets then
\begin{equation*}
\mu\left(\Union_{k=1}^\infty A_k \right) = \sum_{k=1}^\infty
\mu(A_k)
\end{equation*}
\item $\mu(\Omega) = 1$
\end{enumerate}
\end{definition}
A probability space describes the set of all possible outcomes $\Omega$, the
measurable subsets of outcomes $\F$, and the probability $P$ of those measurable
outcomes.
\begin{definition}[Probability space]\label{def:probability_space}
	A probability space is a triple $(\Omega, \F, P)$ where
	\begin{enumerate}
		\item $\Omega$ is the set of all possible outcomes,
		\item $\F$ is a $\sigma$-field in $\Omega$, and
		\item $P$ assigns a probability to every event and satisfies the
			following conditions:
			\begin{enumerate}
				\item $0 \leq P(A) \leq 1$ for $A \in \F$,
				\item $P(\emptyset) = 0$, and $P(\Omega) = 1$,
				\item $ $\todo{invariance of permutation.}
			\end{enumerate}
	\end{enumerate}
	\todo{Refer to a definition of a $\sigma$-algebra.}
\end{definition}
In the following, we will only consider discrete random variables $X : \Omega
\rightarrow \Z$ with countably (but possibly infinitely) many possible results,
since only discrete random variables are relevant for this thesis.
An integer program consists of a finite set of locations and transitions
between those locations. A run of a program is a sequence of configurations,
where every configuration contains the location at which the program currently
is and a state that holds the current values of the program variables. A
transition contains a condition, called its \textit{guard}, that must be
satisfied by the current state for the transition to be taken. Whenever a
transition is taken it can modify the state with some updates. An update
assigns a new value to a program variable depending on the previous state.
Every integer program starts at a unique location usually called $l_0$.
Whenever no transition guard is satisfied the program terminates.
Non-deterministic programs have mutually non-exclusive transitions leaving the
same location. Hence it is unclear which transition is taken at runtime; the
decision is made by a scheduler. Also, guards and updates of a transition might
depend on temporary variables that are not set by the state.
\begin{example}\label{ex:nd_branching}
\begin{figure}[h]
\centering
\input{figures/ch2_ex_pip_nd.tex}
\caption{A non-deterministic integer program over the variables $\V =
\{x\}$.\label{fig:ex_pip_nd}}
\end{figure}
	Take the program displayed in \fref{fig:ex_pip_nd} for example. At location
	$l_1$ with the state $\sigma(x) = 3$ both transitions $t_2$ and $t_3$ are
	possible, since both of their guards $x > 0$ and $x > 1$ are satisfied. At
	runtime the decision which transition is taken is arbitrary
	(non-deterministic).
\end{example}
For the following, the set of all variables is split into the program variables
$\PV$ and the temporary variables $\TV$. Program variables are assigned at the
start of a program and can get values assigned during the run of a program,
whereas temporary variables are only existentially quantified for every
transition. Hence, they do not \enquote{carry over} between states.
A similar concept to non-determinism (where the decision is fully arbitrary) is
to give a probability to each transition. Instead of picking the transition
fully arbitrarily, the transitions are picked with their respective probability.
Although similar, non-deterministic and probabilistic branching are treated
separately. In order to allow both concepts in a program, one introduces the
concept of \textit{general transitions}: they are sets of (conventional)
transitions with the probabilities adding up to 1, acting as a single transition
for the resolution of non-determinism. Non-determinism can only occur between
general transitions and it is resolved before the probabilities are resolved,
and every transition in a general transition must have the same guard.
\begin{example}\label{ex:prob_branching}
\begin{figure}[h]
\centering
\input{figures/ch2_ex_pip_prob.tex}
\caption{A probabilistic (and non-deterministic) integer program over
the variables $\V= \{x\}$. \label{fig:ex_pip_prob}}
\end{figure}
Take the program displayed in \fref{fig:ex_pip_prob} for example. The
transitions $t_2$ and $t_3$ are part of a general transition (marked in
red). For simplicity, all other transitions are unique members of their own
general transition and the trivial probability of 1 is omitted.
	At location $l_1$ with a variable assignment $\sigma(x) = 3$ three
	transitions $t_2$, $t_3$ and $t_4$ are possible. The non-determinism is
	resolved first, selecting either the general transition $\{t_2, t_3\}$ or
	the general transition $\{t_4\}$; if $\{t_2, t_3\}$ is selected, one of
	$t_2$ and $t_3$ is then taken with probability $0.5$ each.
\end{example}
Besides probabilistic branching, variable assignments can be non-deterministic
or probabilistic, which is also called non-deterministic or probabilistic
sampling. Non-deterministic sampling occurs when, on a transition, a variable is
updated to an expression that contains unbound variables (variables that are not
assigned a value in the previous state). The unbound variables are sampled
arbitrarily from all the integers, but can be constrained by the guard, in which
case the transition is only taken if the non-deterministic sampling fulfills the
guard. If the sampled value fulfills no transition's guard, the program
terminates. Non-deterministic sampling is resolved before the non-deterministic
branching.
\begin{example}\label{ex:nd_sampling}
\begin{figure}[h]
\centering
\input{figures/ch2_ex_pip_nds.tex}
\caption{An integer program with non-deterministic sampling over
the variables $\V= \{x, t\}$ with program variables $\PV=\{x\}$.
\label{fig:ex_pip_nds}}
\end{figure}
	Take the program displayed in \fref{fig:ex_pip_nds} for example. The
	transition $t_2$ contains an update with a temporary variable $t$.
	Furthermore, the temporary variable is constrained to $1 \leq t \leq 3$.
	Since the temporary variable $t$ is not bound in the state $\sigma: \PV
	\rightarrow \Z$, the variable can take any arbitrary value.
	Whenever the temporary variable is sampled to a value not satisfying the
	guard of $t_2$ while $x$ is larger than zero, the program terminates.
\end{example}
Probabilistic sampling is done using probability distributions; only the
probability distributions from \Sref{ssec:distributions} are supported.
Updates are restricted to integer polynomials over the variables and, when
probabilistic sampling is allowed, additionally over distributions. The value of
an indeterminate in the polynomial is equal to the value of the (possibly
temporary) variable, or is sampled from the distribution with the corresponding
probability.
\begin{example}\label{ex:prob_sampling}
\begin{figure}[h]
\centering
\input{figures/ch2_ex_pip_probs.tex}
\caption{An integer program with probabilistic sampling over
the variables $\V= \{x\}$ with program variables $\PV=\{x\}$.
\label{fig:ex_pip_probs}}
\end{figure}
	Take the program depicted in \fref{fig:ex_pip_probs} for example. In
	transition $t_2$, the variable $x$ is assigned the polynomial $x -
	\textsc{Bern}(0.5)$. The Bernoulli distribution takes the value $0$ or $1$,
	each with a probability of $0.5$. In case the distribution is sampled to
	$1$, the variable $x$ is decremented, and it stays the same otherwise.
\end{example}
Deterministic non-probabilistic programs are a special case of probabilistic
programs, where every general transition consists of a single transition, all
general transitions are mutually exclusive, and no non-deterministic or
probabilistic sampling is done in the transitions. Similarly, non-deterministic
non-probabilistic programs are a special case of probabilistic programs where
every general transition contains only a single transition and no probabilistic
sampling is allowed.
This thesis will closely follow the formal definitions of F. Meyer
\cite{meyer2021tacas}. First the formal definition of a probabilistic program
is given, then the semantics are introduced.
\begin{definition}[Probabilistic Integer Program]\label{def:pip}
	A \gls{pip} is a tuple $(\V, L, \GT, l_0)$ of a set of variables, a set of
	locations, a set of general transitions and a start location $l_0$. Every
	transition $t = (l, p, \tau, \eta, l') \in g$ of a general transition
	$g \in \GT$ has a start location $l$, a target location $l'$, and
	\begin{itemize}
		\item a probability $p \geq 0$, that the transition is taken
			when the corresponding general transition $g$ is executed,
		\item a guard $\tau \in C$, and
		\item an update function $\eta : \PV \mapsto \Z[\V \cup D]$,
			mapping every program variable to an integer polynomial
			containing variables or distribution functions.
	\end{itemize}
	All $t \in g$ must share the same start location $l$ and guard $\tau$, and
	the probabilities of all transitions in $g$ add up to $1$.
\end{definition}
\subsection{Non-deterministic and probabilistic branching and assignments}
\begin{comment}
- Probabilistic branching
- Non-determinstic branching
- probabilistic assignments (via branching)
- non-deterministic assignments (via temporary variables)
\end{comment}
Various languages exist to represent integer programs in a machine-readable
form, namely the \gls{koat} input format\cite{}, {CINT}, and the {XML}-based
{XTC} format of the \gls{tpdb}.
% \cite{https://raw.githubusercontent.com/TermCOMP/TPDB/master/xml/xtc.xsd}
% - CINT
% - Koat Format
% For probabilistic: PIP
During this thesis we will transform programs. The goal is to find equivalent
programs that are easier to analyze by KoAT2. But what does equivalence mean?
For non-probabilistic programs one would expect that, while being structurally
different, the new program produces the same outcome as the old one.
In addition, the new program should take the same time as the old one. Since
costs are represented as a variable, this is part of the outcome. But the
runtime of a program is calculated by ranking functions, and they count the
number of visits to a location. In order for the runtime to be the same, the
bounds shall remain the same. \todo{doesn't realy make sence!}
In probabilistic programs, the run is non-deterministic and hence calculating
the runtime is impossible. Instead we have expected runtime bounds. So the new
program should have the same expected runtime bounds and the same expected
costs as the old program. Let us give a more formal definition.
\begin{definition}[Program equivalence]
	Two PIPs $P = (\V, L, \GT, l_0)$ and $P' = (\V, L', \GT', l_0)$
	are equivalent if and only if the following properties hold:
\begin{enumerate}
\item \todo{continue}
\end{enumerate}
\end{definition}
\subsection{Strongly connected components}
A given \gls{pip} induces two relations on its locations: the first one relates
two locations if a transition exists from one to the other, and the second one
relates them if a path exists from one to the other.
\subsection{Semantics}
\todo{open question regarding temporary variables}
% the original definition alled states defining variables, but this let's
% temporary variables carry-over to the next transition. Is this what we
% want?
Before defining the semantics of a \gls{pip}, a new special location $l_\bot$ is
introduced to indicate the termination of a program, together with a virtual
transition $t_\bot$ and a general transition $gt_\bot = \{t_\bot\}$ serving the
same purpose. Instead of just vaguely \enquote{terminating}, a program takes
the transition $gt_\bot$ to the location $l_\bot$ if and only if no other
transition is walkable. Since no normal transition leaves the location $l_\bot$,
the run loops indefinitely on $l_\bot$ after termination. In addition, a new
transition $t_\text{in}$ will be used for the start of the program.
A state $s$ is a variable assignment for the variables of a program, $s: \V
\rightarrow \Z$, and $\Sigma$ is the set of all states. The set of
configurations is defined as $\confs = (L \union \{l_\bot\}) \times (\T \union
\{t_{\text{in}}, t_\bot\}) \times \Sigma$.
Note that in addition to the location and state, the last transition taken to
the current location is captured as well. This won't be relevant for the partial
evaluation but is important to define the probabilistic properties of a
\gls{pip}.
A run of the program is an \textit{infinite} sequence of configurations, and the
set of all runs is defined as $\runs = \confs^\omega$. In contrast a finite
prefix is a finite sequence of configurations. The set of all finite prefixes is
defined as $\fpath = \confs^*$.
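For example, for the program in \fref{fig:ex_pip_probs} and a start state $s_0$
with $s_0(x) = 1$, one possible run is
\begin{equation*}
	(l_0, t_{\text{in}}, s_0)\, (l_1, t_1, s_0)\, (l_1, t_2, s_1)\,
	(l_2, t_3, s_1)\, (l_\bot, t_\bot, s_1)\, (l_\bot, t_\bot, s_1) \cdots
\end{equation*}
where $s_1(x) = 0$, i.e. the Bernoulli distribution was sampled to $1$ in the
single execution of $t_2$.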
\begin{rem}
The set of configurations does not exclude invalid combinations of
locations and transitions, that is a configuration with a location that is
not the target of the incoming transition, or a state that is impossible to
reach via the incoming transition. Likewise, the set of runs and finite
prefixes does not exclude invalid paths, e.g. two consecutive configurations
that cannot be reached via the given transition, etc. The validity of a path
will be described by a probability measure where invalid paths have a zero
probability.
\end{rem}
For a \gls{pip} one can define a probability space $(\runs, \F, \textit{pr})$.
The outcomes of the probabilistic event in this space are the runs of the
program. Every distinct run is measurable, hence the $\sigma$-algebra $\F$ is
defined to contain every set $\{r\}$ for $r \in \runs$. The probability measure
$\textit{pr}$ describes the probability of the given runs. Formally, the
probability space is defined by a cylindrical construction \todo{elaborate}.
Since the construction is rather involved we will only summarize the properties
relevant to this thesis.
First, the resolution of non-determinism is separated from the probabilities:
for all following considerations the non-determinism is assumed to be resolved
by a scheduler, and the probability measure depends on this scheduler.
The probability of a specific run in the probability space is equal to the
probability that every transition in the run is taken. Naturally, invalid
transitions (either because they do not exist in the program, or because the
guard is not satisfied) have a zero probability.
The probability space will be used to define the semantics of a \gls{pip}.
\subsection{Notes about the probability measure}
Probability that a variable $x$ takes the value $s(x)$ when taking the
transition $t$ from a (non-deterministically resolved) assignment $\tilde{s}$:
\todo{redefine with polynomials over indeterminates}
\begin{align}
q_{\tilde{s},t,s(x)}(x)
\end{align}
(Trivial) probability that the temporary variables got assigned their expected
values, given a (non-deterministically resolved) assignment $\tilde{s}$ and the
resulting assignment $s$:
\begin{align}
	\delta_{\tilde{s}(u),s(u)}
\end{align}
Probability of a transition after a finite prefix: for $f = \dots (l', t', s') \in \fpath$, $(l, t,
s) \in \confs$, and $t = (l', p, \tau, \eta, l)$:
\begin{align}
	pr_{\mathfrak{S},s_0}(f \rightarrow (l, t, s)) = p \cdot \prod_{x\in\PV}
	q_{\tilde{s},t,s(x)}(x) \cdot \prod_{u \in \TV} \delta_{\tilde{s}(u),s(u)}
\end{align}
\begin{rem}
The probability depends on the scheduler $\mathfrak{S}$ and the starting
state $s_0$.
\end{rem}
Probability of a finite prefix. For $f = c_0, \dots, c_n \in \fpath$:
\begin{align}
pr_{\mathfrak{S},s_0}(f) = pr_{\mathfrak{S},s_0}(c_0) \cdot \prod_{i=1}^n pr_{\mathfrak{S},s_0}(c_{i-1} \rightarrow c_i)
\end{align}
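For example, for the program in \fref{fig:ex_pip_prob}, a scheduler
$\mathfrak{S}$ that selects the general transition $\{t_2, t_3\}$ at $l_1$, and
a start state $s_0$ with $s_0(x) = 3$, the finite prefix that takes $t_1$ and
then $t_2$ has probability $1 \cdot 0.5 = 0.5$: $t_1$ is the only member of a
trivial general transition, and $t_2$ is taken with probability $p = 0.5$ once
its general transition has been selected.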
The cylindrical construction yields the unique probability measure
$\mathbf{P}_{\mathfrak{S},s_0} : \F \rightarrow [0,1]$ for infinite runs.
\subsection{Runtime}
\begin{comment}
for a transition:
- constant cost
- most simple case cost = 1 for every transition
- combining transitions and adding costs
- costs depending on variables
for a prefix:
- finite sequence of configurations
- runtime = sum of all costs over all steps in the prefix
- probability = product over all transition probabilities in the prefix
- legal prefix = non-zero probability
for a path:
- infinite sequence of configurations
- runtime = runtime of the largest non-zero probability prefix
- pro
legal paths = paths with a non-zero
for a program:
- supremum over runtime of all paths
\end{comment}
\begin{definition}[Runtime of a run]
\end{definition}
\begin{definition}[Worst-case runtime of a Program]
\end{definition}
\begin{definition}[Expected runtime of a Program]
\end{definition}
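Following the outline in the comment above, the intended notions can be
sketched as follows, assuming a constant cost of $1$ per transition (the symbol
$\mathcal{R}$ is only used for this sketch): the runtime of a run
$r = c_0 c_1 c_2 \dots \in \runs$ is the number of steps taken before the
program reaches $l_\bot$,
\begin{equation*}
	\mathcal{R}(r) = |\{\, i \in \N \mid c_i = (l_i, t_i, s_i) \text{ with } t_i \notin \{t_{\text{in}}, t_\bot\} \,\}| ,
\end{equation*}
the worst-case runtime of a program is the supremum of $\mathcal{R}(r)$ over
all runs whose finite prefixes have non-zero probability, and the expected
runtime is the expected value of $\mathcal{R}$ with respect to the probability
measure $\mathbf{P}_{\mathfrak{S},s_0}$.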
Ranking functions are a widely used tool to prove termination and runtime
bounds of integer transition systems. The simplest variant of ranking functions
is the \gls{lrf}.
We seek a function $f(x_1,\dots,x_n) = a_1x_1 + \cdots + a_nx_n + a_0$ with the rationals as a co-domain, such that
\begin{enumerate}
	\item $f(\bar{x}) \geq 0$ for any valuation $\bar{x}$ that satisfies the loop constraints;
	\item $f(\bar{x}) - f(\bar{x}') \geq 1$ for any transition leading from $\bar{x}$ to $\bar{x}'$
\end{enumerate}
\cite{benamram2017}\todo{plagiat}
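For example, for the self-loop $t_3$ in \fref{fig:ex_pip_nd} with guard $x > 0$
and update $x := x - 1$, the function $f(x) = x$ is a \gls{lrf}: the guard
implies $f(x) = x \geq 1 \geq 0$, and $f(x) - f(x') = x - (x - 1) = 1 \geq 1$.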
% Intuition: The ranking function decreases for every walkable transition. If such a ranking function exists, the loop terminates. \todo{not sure about this, guess}
% \section{Lexicographic ranking functions}
% We expand the \gls{lrf} to a tuple of \gls{lrf}. Where whenever lexicograpically higher function decreases lower ones can increase again.
\section{Goal}
Transform a program into an equivalent program. \todo{define equivalence of
programs}
is strongly related to the search for upper and lower runtime bounds, or the
runtime complexity of a program, which is equally undecidable. Nevertheless, the
answers to those questions are very important in practice. For example, a
compiler might want to warn the programmer about faulty code sections that were
not explicitly marked to run indefinitely, or a developer could be required to
prove the efficiency of a program in critical scenarios. In an ever more
complex world, with ever more complex algorithms, the need for automatic tools
arose. Even though the question of runtime complexity cannot be answered in the
general case, many tools were developed to automatically analyze the complexity
of various programming paradigms as tightly and as quickly as possible.
runtime-complexity and size bounds on transition systems. At its core,
KoAT computes bounds for subprograms using \gls{mprf} or \gls{twn}, and then
combines the subprogram bounds to generate upper runtime-complexity and size
bounds for the whole program.
Optionally, to improve the analysis, KoAT can resort to partial evaluation
as a control-flow refinement technique\cite{giesl2022lncs}.
At first \gls{koat} was aimed at linear integer programs, but it was recently
extended to probabilistic integer programs\cite{meyer2021tacas} and
non-linear arithmetic\todo{citation needed}.
The tool iRankFinder\cite{irankfinder2018wst} is another tool taking part in
\gls{termcomp}. It uses linear and lexicographic ranking functions for the
analysis and internally represents the program as a \gls{chc} program, which is
closely related to integer transition systems in the sense that integer
transition systems can be transformed into equivalent \gls{chc} systems.
Control-flow refinement is a technique where a program is transformed into a
semantically equivalent program, which is easier to analyse with the existing
analysis techniques (e.g. linear, lexicographic, and multiphase ranking
functions). The technique was put forward by \citeauthor{gulwani2009}
\cite{gulwani2009}. A typical example of such a program can be seen
in Example~\ref{ex:splitterloop}, where a single loop is replaced by two
independent consecutive loops. iRankFinder successfully implemented the
control-flow refinement via partial evaluation proposed in
\cite{gallagher2019eptcs,domenech2019arxiv}.
\gls{koat} borrowed the implementation of iRankFinder as a black box, which came
with a number of limitations\cite{giesl2022wst}: besides code-quality and
performance issues, the external library would not be able to profit from future
improvements to the algorithms. This thesis improves on the latest version of
\gls{koat} by reimplementing the control-flow refinement technique of
iRankFinder\cite{irankfinder2018wst} natively in KoAT instead of calling the
external library, and by adapting it to the paradigm of probabilistic programs.
The well-known basics required to understand this thesis are recapitulated in
\Sref{sec:preliminaries}, focusing especially on constraints, probability, and
(probabilistic) integer programs. In \Sref{sec:theory} the \gls{cfr} techniques
from iRankFinder are adapted to \Gls{pip}, and the theoretical correctness of
the construction is proven. \Sref{sec:implementation} will focus on the
changes made to \gls{koat} and the challenges met during the implementation of
the technique in OCaml. Finally, in \Cref{sec:conclusion} the new version of
\gls{koat} will be compared to its predecessor with regard to the found
runtime-complexity and size bounds as well as the overall computational
performance of the tool, using the problems from the \gls{tpdb}.
\newacronym{twn}{TWN}{triangular weakly non-linear loop}
\newacronym{scc}{SCC}{strongly connected component}