@InCollection{barwise1977,
  author    = {Jon Barwise},
  editor    = {Jon Barwise},
  title     = {An Introduction to First-Order Logic},
  booktitle = {Handbook of Mathematical Logic},
  publisher = {Elsevier},
  year      = {1977},
  pages     = {5--46},
  series    = {Studies in Logic and the Foundations of Mathematics},
  volume    = {90},
  issn      = {0049-237X},
  doi       = {10.1016/S0049-237X(08)71097-8},
  url       = {https://www.sciencedirect.com/science/article/pii/S0049237X08710978},
}

@InProceedings{gurfinkel2010,
  author    = {Arie Gurfinkel and Sagar Chaki},
  editor    = {Radhia Cousot and Matthieu Martel},
  title     = {Boxes: {A} Symbolic Abstract Domain of Boxes},
  booktitle = {Static Analysis - 17th International Symposium, {SAS} 2010, Perpignan, France, September 14-16, 2010. Proceedings},
  publisher = {Springer},
  series    = {Lecture Notes in Computer Science},
  volume    = {6337},
  year      = {2010},
  pages     = {287--303},
  doi       = {10.1007/978-3-642-15769-1\_18},
  url       = {https://doi.org/10.1007/978-3-642-15769-1\_18},
}
% TeX root = ../main.tex
\begin{tikzpicture}[scale=0.5]
  \begin{axis}[
      axis lines=center, axis on top,
      xmin=-3.3, xmax=3.3, ymin=0, ymax=5.3,
      x=1cm, y=1cm,
      xtick={-3,...,3}, ytick={0,...,5},
      xlabel=x, ylabel=y, font=\tiny,
    ]
    \addplot [name path=A, thick] {x + 4};
    \addplot [name path=B, thick] {x + 1};
    \addplot [name path=C, thick] {-x + 4};
    \addplot [name path=D, thick] {-x + 1};
    \addplot [name path=top, draw=none] {5.3};
    \addplot [name path=bottom, draw=none] {0};
    \addplot [pattern=north west lines, pattern color=blue!30] fill between[of=A and top];
    \addplot [pattern=north west lines, pattern color=blue!30] fill between[of=C and top];
    \addplot [pattern=north west lines, pattern color=blue!30] fill between[of=B and bottom];
    \addplot [pattern=north west lines, pattern color=blue!30] fill between[of=D and bottom];
    \addplot [only marks, mark=o] coordinates {
      (0, 4)
      (-1, 3) (0, 3) (1, 3)
      (-1, 2) (0, 2) (1, 2)
      (0, 1)
    };
    \addplot [fill=red, fill opacity=0.20] fill between[of=B and bottom, softclip={domain=0:1.5}];
    \addplot [fill=red, fill opacity=0.20] fill between[of=D and bottom, softclip={domain=-1.5:0}];
  \end{axis}
\end{tikzpicture}
% TeX root = ../main.tex
\begin{tikzpicture}[scale=0.5]
  \begin{axis}[
      axis lines=center, axis on top,
      xmin=-3.3, xmax=3.3, ymin=-3.3, ymax=3.3,
      x=1cm, y=1cm,
      xtick={-3,...,3}, ytick={-3,...,3},
      xlabel=x, ylabel=y, font=\tiny,
    ]
    \addplot [name path=A, thick] {0.5*x + 1};
    \addplot [name path=C, draw=none] {3.3};
    \addplot [name path=B, thick] {0.5*x*x - 2};
    \addplot [name path=D, draw=none] {-3.3};
    \addplot [pattern=north west lines, pattern color=blue!30] fill between[of=A and C];
    \addplot [pattern=north east lines, pattern color=red!30] fill between[of=B and D];
    \addplot [only marks, mark=o] coordinates {
      (2, 2)
      (0, 1) (1, 1) (2, 1)
      (-1, 0) (0, 0) (1, 0)
      (-1, -1) (0, -1) (1, -1)
    };
  \end{axis}
\end{tikzpicture}
% TeX root = ../main.tex
\begin{tikzpicture}[scale=0.5]
  \begin{axis}[
      axis lines=center, axis on top,
      xmin=-3.3, xmax=3.3, ymin=-3.3, ymax=3.3,
      x=1cm, y=1cm,
      xtick={-3,...,3}, ytick={-3,...,3},
      xlabel=x, ylabel=y, font=\tiny,
    ]
    \addplot [name path=B, thick] {0.5*x*x - 2};
    \addplot [name path=D, draw=none] {-3.3};
    \addplot [pattern=north east lines, pattern color=red!30] fill between[of=B and D];
    \addplot [only marks, mark=o] coordinates {
      (-3, 3) (-2, 3) (-1, 3) (0, 3) (1, 3) (2, 3) (3, 3)
      (-2, 2) (-1, 2) (0, 2) (1, 2) (2, 2)
      (-2, 1) (-1, 1) (0, 1) (1, 1) (2, 1)
      (-1, 0) (0, 0) (1, 0)
      (-1, -1) (0, -1) (1, -1)
    };
  \end{axis}
\end{tikzpicture}
% TeX root = ../main.tex
\begin{tikzpicture}[scale=0.5]
  \begin{axis}[
      axis lines=center, axis on top,
      xmin=-3.3, xmax=3.3, ymin=-3.3, ymax=3.3,
      x=1cm, y=1cm,
      xtick={-3,...,3}, ytick={-3,...,3},
      xlabel=x, ylabel=y, font=\tiny,
    ]
    \addplot [name path=A, thick] {0.5*x + 1};
    \addplot [name path=C, draw=none] {3.3};
    \addplot [pattern=north west lines, pattern color=blue!30] fill between[of=A and C];
    \addplot [only marks, mark=o] coordinates {
      (2, 2) (3, 2)
      (0, 1) (1, 1) (2, 1) (3, 1)
      (-2, 0) (-1, 0) (0, 0) (1, 0) (2, 0) (3, 0)
      (-3, -1) (-2, -1) (-1, -1) (0, -1) (1, -1) (2, -1) (3, -1)
      (-3, -2) (-2, -2) (-1, -2) (0, -2) (1, -2) (2, -2) (3, -2)
      (-3, -3) (-2, -3) (-1, -3) (0, -3) (1, -3) (2, -3) (3, -3)
    };
    \addplot [only marks, mark=o, red!80] coordinates { (0, -2) };
  \end{axis}
\end{tikzpicture}
\ESns(\Cost(\Prog')) &= \sum_{i=1}^\infty i \cdot \prSns(\Cost(\Prog') = i)
= \sum_{i=1}^\infty \prSns(\Cost(\Prog') \geq i)
= \sum_{i=1}^\infty \sum_{\substack{f \in \fpath_{\Prog'}\\ \Cost(f) \geq i}} \prSns(f) \\
% & \leq \sum_{i=1}^\infty \sum_{\substack{f \in \fpath_{\Prog'}\\ \Rt(f) \leq i}} \prSns(f)
% = \ESns(\Rt(\Prog'))
\subsection{Expected size bounds}
\section{Abstraction}\label{sec:abstraction}

In \Sref{sec:partialevaluation} the abstraction was represented by an oracle
that decides whether a location is abstracted, and by an abstraction function.
It was stated that Algorithm \ref{alg:evaluate_abstr} terminates if
\begin{enumerate}
    \item the oracle eventually always decides to abstract, and
    \item the abstraction has only a finite number of possible results.
\end{enumerate}
First, we will discuss some possibilities to select the locations for
abstraction, and then adapt the property based abstraction developed by
\citeauthor{Domenech19}\cite{Domenech19} to probabilistic integer programs.
\subsection{Abstract everything}
\begin{comment}
pro: easy to implement
contra:
- abstractions are expensive
- abstractions lose precision
open question:
- how to select properties
\end{comment}
The naive approach would be to abstract at every location, as also stated in
\cite{Domenech19}. The advantage is that the implementation is easy. The
evaluated program is small and its analysis fast. The disadvantage is that a
lot of evaluated control-flow is lost to the abstraction. The property based
abstraction presented in \Sref{sec:propertybasedabstraction} requires
$\Theta(n)$ calls to the \gls{smt}-solver, which is computationally expensive.

The primary goal of the presented \gls{cfr} via partial evaluation is to
evaluate overlapping loops in order to find smaller loops that are easier to
analyse. In practice, the control-flow of a loop is mostly linear. Abstracting
the linear control-flow could merge two linear sections that would otherwise
stay separated, and thus make finding tight bounds harder in the process.

\subsection{Abstract Loop heads}\label{ssec:loopheads}

The second method proposed by \cite{Domenech19} is to abstract only on loop
heads. Termination is guaranteed since every infinite path in the evaluation
tree of a finite program must visit some loop (and in turn its head) an
infinite number of times. With only finitely many possible abstraction
results, it is guaranteed that at some point some version repeats and the
evaluation backtracks.

The exact definition of a loop head is unclear. For the sake of termination it
is sufficient that every loop contains at least one (but possibly arbitrary)
location marked for abstraction. The intuitive candidate is the head of the
loop, since that is the location where most branching will probably occur in
practice. For this implementation a loop head is defined as follows.

\begin{definition}
    A \textit{loop head} of a loop is the first location of the loop
    encountered during a depth-first search starting at the start location
    $l_0$.
\end{definition}
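For illustration, consider the following constructed example.
\begin{example}
    Consider a program with locations $l_0, l_1, l_2$ and transitions $l_0
    \rightarrow l_1$, $l_1 \rightarrow l_2$, and $l_2 \rightarrow l_1$. A
    depth-first search starting at $l_0$ encounters $l_1$ before $l_2$, hence
    $l_1$ is the loop head of the loop $\{l_1, l_2\}$.
\end{example}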
When selecting all loop heads for abstraction, multiple loop heads can end up
on a single loop, for example when the loop overlaps with another loop (see
examples \todo{} \todo{}).
\begin{figure}
    \input{figures/ch3_loopheads}
\end{figure}
Detecting loops and loop heads is further discussed in
\Sref{sec:findingloops}.
\todo{prove upper bound on program size}
% Since
% In addition control-flow refinement was introduced to unroll loops in such a way
% that hidden branching is resolved. The heuristics presented by \cite{Domenech19}
% are focused on loops and the properties are selected for the loop heads.
% Constructing a heuristic, that is well suited for every location in the program
% is not obvious is left open for future work.

\subsection{Property based abstraction}\label{sec:propertybasedabstraction}

\section{Sub-\gls{scc} level evaluation}
First, some basic notation is introduced. Let $\overline{\N} = \N \union
\{\infty\}$. $A^*$ is the set of finite words and $A^\omega$ is the set of
infinite words over an alphabet $A$. The set of all integer polynomials over
some indeterminates $A$ is denoted by $\Z[A]$. A syntactical substitution
where one symbol is replaced by another is denoted with
$[\cdot\backslash{}\cdot]$. For example $(x<y)[x\backslash{}1] = (1 < y)$. For
a finite set $A = \{x_1,\dots,x_n\}$, the process of $n$ consecutive
substitutions $[x_i\backslash{}y(i)]$, where the replacement expression $y$
varies only in some index $i$, is denoted using the shortened notation
$[x_i\backslash{}y_i]_{x_i \in A} = [x_1\backslash{}y(1)] \dots
[x_n\backslash{}y(n)]$. For example $[x_i\backslash{}i]_{x_i\in A} =
[x_1\backslash{}1] \dots [x_n\backslash{}n]$, where every
variable is replaced by its index in $A = \{x_1, \dots, x_n\}$. The
restriction of a function $f: A \rightarrow B$ to a smaller domain $A' \subset
A$ is denoted by $f|_{A'} : A' \rightarrow B$.
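For example, for an assignment $\beta: \{x, y\} \rightarrow \Z$ with
$\beta(x) = 1$ and $\beta(y) = 2$, the restriction $\beta|_{\{x\}}$ is defined
only on $x$ and still maps $x \mapsto 1$.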
Let $\Zs := (\Z, +, \cdot, 0, 1, \leq, <, =)$ be the structure of standard
integer arithmetic, and $\Rs := (\R, +, \cdot, 0, 1, \leq, <, =)$ the
structure of standard real arithmetic. In the following, $\V$ denotes a finite
set of variables.
This section will define the foundations of various types of constraints that
are special cases of formulas of \gls{fo} logic. The set of quantifier-free
formulas of \gls{fo} logic over a variable set $A\subset\V$ is denoted with
$\Phi_A$, or simply $\Phi$ when $A=\V$. For the foundations of \gls{fo} logic
we refer to the literature\cite{barwise1977}. Using the $\models$ and
$\equiv$ relations from \gls{fo} logic, the notion of satisfiability is
defined.

\begin{definition}[Satisfiability\cite{barwise1977}]\label{def:satisfiability}
    For a domain $A$ and a structure $\mathfrak{A} = (A, +, \cdot, 0, 1, \leq,
    <, =)$ we say a variable assignment $\beta: \V \rightarrow A$
    \textit{satisfies} the formula $\phi \in \Phi$ when $\mathfrak{A}, \beta
    \models \phi$. $\phi$ is \textit{satisfiable} when an assignment $\beta:
    \V \rightarrow A$ exists such that $\mathfrak{A},\beta\models \phi$. When
    $\phi$ is satisfied by every assignment, one writes $\mathfrak{A} \models
    \phi$.
\end{definition}

\begin{definition}[Solutions\cite{Domenech19}]\label{def:solutions}
    Let $\varphi \in \Phi$ be an \gls{fo}-formula. $\llbracket \varphi
    \rrbracket$ is defined as the set of all satisfying assignments, the
    \textit{solutions} of the formula $\varphi$.
\end{definition}
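The following example illustrates both definitions over the integers.
\begin{example}
    Consider the formula $\varphi = (0 \leq x \land x < 2)$ over the structure
    $\Zs$. The assignment $\beta$ with $\beta(x) = 1$ satisfies $\varphi$,
    hence $\varphi$ is satisfiable. The set of solutions is $\llbracket
    \varphi \rrbracket = \{\beta : \V \rightarrow \Z \mid \beta(x) \in \{0,
    1\}\}$.
\end{example}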
Strict and non-strict linear constraints are a subset of strict polynomialconstraints and non-strict polynomial constraints respectively. For the mostpart we will just refer to \enquote{constraints} when the distinctionbetween strict and non-strict or linear and polynomial constraints isunimportant.
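To make the distinction concrete, consider the following example.
\begin{example}
    $x < y$ is a strict linear constraint and $2x + 3y \leq 5$ is a non-strict
    linear constraint. $x^2 \leq y$ is a non-strict polynomial constraint but
    not a linear one.
\end{example}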
Constraints are a subset of formulas in \gls{fo} logic; thus, their semantics
are defined accordingly.
A set of constraints $C \subseteq \C$ is satisfiable when their conjunction is
satisfiable, and we write $\mathfrak{A}, \beta \models C$ instead of
$\mathfrak{A}, \beta \models \LAnd_{\psi_i \in C} \psi_i$. In addition, this
thesis will only consider integer arithmetic, with the structure $\Zs$ of
standard integer arithmetic defined above. We write $\models \psi$ and $\beta
\models \psi$ instead of $\Zs \models \psi$ and $\Zs, \beta \models \psi$
respectively.
\begin{definition}[Entailment\cite{Domenech19}]
    Let $\varphi_1, \varphi_2 \in \Phi$. If $\llbracket \varphi_1 \rrbracket
    \subseteq \llbracket \varphi_2 \rrbracket$, we say that $\varphi_1$
    \textit{entails} $\varphi_2$.
variables that are only relevant to the scope of a transition. In \gls{fo}
logic one would simply existentially quantify the variable. However, the new
\gls{fo} formula would no longer be quantifier-free. Instead, a new
quantifier-free formula is sought that has exactly the same solutions when
ignoring the values of the irrelevant variables.
Let $A \subseteq \V$ and $\varphi \in \Phi$. The projection of $\varphi$ onto
$A$, denoted as $\varphi|_A$, is a quantifier-free \gls{fo} formula
$\varphi|_A \in \Phi_A$ with $\llbracket \varphi|_A \rrbracket =
\set{\beta|_A}{\beta \in \llbracket \varphi \rrbracket}$.
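For example, projecting $\varphi = (0 \leq x \land x \leq y)$ onto $A =
\{y\}$ yields $\varphi|_A = (0 \leq y)$, since exactly the assignments with
$\beta(y) \geq 0$ can be extended to a solution of $\varphi$.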
whereas for updates there exists a \textit{before} and an \textit{after}.
constraint partitions the space. One part is included and the other is
excluded. In the case of integer arithmetic the solutions are discrete points
in this space.
An abstract domain is a representation of those sets of points. Usually an
abstract value over-approximates the set of points in order to facilitate
operations. Commonly used abstract domains are
Polyhedra\cite{bagnara2005convexpolyhedron}
equal to the intersection of both sets of solutions. While $\varphi_1$ and
$\varphi_2$ have infinitely many solutions, the conjunction $\varphi_3$ does
not.
The orthogonal projection computes the projection of an \gls{fo} formula.
Geometrically, the projection can be seen as the set of solutions projected
(casting a shadow) onto the remaining dimensions.
talking about integer arithmetic one refers only to polyhedra. Polyhedra can
represent only linear constraints exactly. Non-linear polynomial constraints
are usually just removed, possibly leaving dimensions unbounded in the
process. There are certainly better linear over-approximations to polynomial
constraints, but finding these would go beyond the scope of this thesis.
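The following example illustrates the loss of precision when a polynomial
constraint is dropped.
\begin{example}
    Consider the constraint set $\{x^2 \leq y, x \geq 0\}$. Every solution
    satisfies $y \geq x^2 \geq 0$. Since $x^2 \leq y$ is not linear, it is
    removed, and the remaining polyhedron is described by $x \geq 0$ alone,
    leaving the dimension $y$ unbounded.
\end{example}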
\todo{more about tightness of operations}\todo{say something aboutoverapproximation of polynomial constraints}
Polyhedra will be used for the partial evaluation algorithm described in
Chapter \ref{ch:theory}, since in practice the partial evaluation is called
only on small sub-programs, where precision is more desirable than
performance.
polyhedron $P$ one can find a box $P'$ that contains the polyhedron $P$. Boxesare computationally very efficient, although rather imprecise for mostapplications.
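For example, the polyhedron described by $x \geq 0 \land y \geq 0 \land x + y
\leq 2$ is contained in the box $0 \leq x \leq 2 \land 0 \leq y \leq 2$, which
is obtained by bounding every dimension independently.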
definitions from \citeauthor{billingsley2011}\cite{billingsley2011}. For
additional information we refer to the
literature\cite{kraaikamp2005modern, billingsley2011}.
Imagine a probabilistic event with some possible outcomes $\Omega$. For
example, a coin-toss can have arbitrarily many outcomes when taking the
position on the table into account, the fact that the coin might get lost in
the process, etc. A probability measure describes the probabilities of sets of
random outcomes. For example, the coin-toss on the table has a subset of
outcomes where the coin's head faces up. The probability measure would assign
a probability close to 50\% to this subset for a somewhat normal coin-toss.
\begin{definition}[$\sigma$-Algebra\cite{billingsley2011}]
    Let $\Omega$ be an arbitrary set. A set $\F \subseteq 2^\Omega$ is called
    a $\sigma$-algebra (also known as $\sigma$-field) when
    \begin{enumerate}
        \item $\Omega \in \F$,
        \item $\F$ is closed under complement, i.e. $B \in \F$ implies
            $B^C \in \F$,
        \item $\F$ is closed under countable unions, i.e. $A_1, A_2, \dots
            \in \F$ implies $\Union_{n\in\N}A_n \in \F$.
    \end{enumerate}
\end{definition}

\begin{definition}[Probability Measure\cite{billingsley2011}]\label{def:measure}
    A set function $\mu$ on a $\sigma$-algebra $\F$ is a probability
\begin{definition}[Probability space\cite{billingsley2011}]\label{def:probability_space}A probability space is a triple $(\Omega,\F,P)$ where the
\item $\F$ is a $\sigma$-algebra containing $\Omega$.
variables in formulas. Informally, a random variable maps the results of aprobabilistic event $\omega$ to a real value, or the value of the random
underlying probability space. In the case of discrete random variables the
distribution is sufficient to fully describe the random variable. The
underlying probability space becomes irrelevant at this point, as the specific
events and their probabilities are not important to the outcome of the random
variable, as long as the probability of the outcome is fully defined.
\begin{definition}[Distribution of a random variable\cite{billingsley2011}]\label{def:distribution}Let $X$ be a discrete random variable. The distribution is described by the
\begin{definition}[Support\cite{billingsley2011}]
    For a random variable with a distribution $\mu$, the support is the
    smallest set $S$ for which $\mu(S) = 1$. Discrete random variables have a
    countable support $S = \{S_1, S_2, \dots\}$.
The Bernoulli distribution is a distribution with two possible outcomes: $1$ and$0$, for example decided by a coin-flip.
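Formally, a Bernoulli distributed random variable $X$ with parameter $p \in
[0, 1]$ satisfies
\begin{equation*}
    P(X = 1) = p \qquad \text{and} \qquad P(X = 0) = 1 - p.
\end{equation*}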
The binomial distribution is similar to the geometric distribution, except
that it counts the number of successes among a fixed number of repeated
independent Bernoulli trials.
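For $n$ trials with success probability $p$, the probability of observing
exactly $k$ successes is
\begin{equation*}
    P(X = k) = \binom{n}{k} p^k (1-p)^{n-k} \qquad \text{for } 0 \leq k \leq n.
\end{equation*}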
When considering a random variable one is usually interested in the value to
expect in general. For example, most possible outcomes of a binomial
distribution are very improbable. This is described by the expected value.
\begin{definition}[Expected Value\cite{billingsley2011}]
    The expected value of a random variable $X$ on a probability space
    $(\Omega, \F, P)$ is the integral of $X$ with respect to the measure $P$:
    \begin{equation*}
        \E(X) = \int X \,dP = \int_\Omega X(\omega) P(d\omega)
    \end{equation*}
    This simplifies for discrete random variables, where the integral can be
    replaced by a sum (see Lemma 48 in \cite{meyer20arxiv}):
    \begin{equation*}
        \E(X) = \sum_{r \in \bar{\R}_{\geq0}} r \cdot P(X = r)
    \end{equation*}
\end{definition}
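The following example applies the discrete case to the distributions
introduced above.
\begin{example}
    For a Bernoulli distributed random variable $X$ with parameter $p$, the
    sum has only two summands and yields $\E(X) = 0 \cdot (1-p) + 1 \cdot p =
    p$. For a geometrically distributed random variable $Y$ with success
    probability $p$, one obtains $\E(Y) = \sum_{k=1}^{\infty} k \cdot p \cdot
    (1-p)^{k-1} = \frac{1}{p}$.
\end{example}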
$\Z[\V\union \D]$ is the set of integer polynomials containing variables $\V$
or probability distributions $\D$. They behave exactly like normal
polynomials, except that the values of the distributions are sampled
probabilistically instead of being given as argument. As such we can define a
function $[\cdot]: \Z[\V\union \D] \rightarrow \Sigma \rightarrow \Z
\rightarrow [0,1]$ that returns the probability $[f](s)(k)$ that the
polynomial $f \in \Z[\V \union \D]$ evaluates to a value $k\in\Z$ under a
state $s \in \Sigma$.
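As an illustration of this semantics, consider the following example, where
$B$ denotes a Bernoulli distribution with parameter $0.5$.
\begin{example}
    Let $f = x + B \in \Z[\V \union \D]$. For a state $s$ with $s(x) = 3$, the
    polynomial evaluates to $3$ or $4$ with equal probability, i.e.
    $[f](s)(3) = [f](s)(4) = 0.5$ and $[f](s)(k) = 0$ for all other $k \in
    \Z$.
\end{example}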
some \textit{update}. An update assigns a new value to a program variabledepending on the previous state. Every integer program starts at a uniquelocation usually called $l_0$. Whenever no transition guard is satisfied theprogram terminates.
Probabilistic sampling is done using probability distributions (recall
\Sref{ssec:distributions}). Updates are restricted to integer polynomials over
the variables and, when probabilistic sampling is allowed, additionally over
distributions. The value of the indeterminate in the polynomial is equal to
the (possibly temporary) variable or sampled from the distribution with the
corresponding probability.
\cite{meyer2021tacas}. First the formal definition of a \acrfull{pip} is
given; then, after a small excursion to Markov decision processes, the
semantics are defined.
\item a source and target location $l,l' \in \Loc$,\item a probability $p \geq 0$ that the transition is takenwhen the corresponding general transition $g$ is executed,\item a guard $\tau \in C$,
We call $\tau_g$ the guard of the general transition $g$, and all transitions
share a common start location, which we call $l_g$.
the same purpose. Instead of just \enquote{terminating}, a program takes the
transition $g_\bot$ to the location $l_\bot$ if and only if no other general
transition's guard is satisfied. Since no normal transition leaves the
location $l_\bot$, the run loops indefinitely on the location $l_\bot$. In
addition a new transition $t_\text{in}$ is added for the start of the program.
\rightarrow \Z$. $\Sigma$ is the set of all states. The set of configurations isdefined as $\confs_\Prog = \Loc_\Prog \union \{l_\bot\} \times \T_\Prog \union \{t_{\text{in}},
\item \textit{states} the decision process is in at a decision epoch;\item \textit{actions} that are selected by the decision process;\item \textit{transition probabilities} that describe the probabilities of
the program are the states of the decision process. Non-deterministic samplingand non-deterministic branching are similar to choosing an action, and the
The highest reward is the optimization goal when taking decisions in a Markov
decision process. One looks for a decision policy that returns the highest
accumulated reward over a whole process. In the
literature\cite{puterman1994markov,puterman1990markov}, the properties of a
given process with regard to the highest achievable rewards are researched
extensively.
complexity. If one defines runtime as reward, one can picture the policy for a
Markov decision process as an adversary. We call this policy a
\enquote{scheduler}.
\item The states are the configurations $\confs_\Prog$ of the program.\item The actions are the selection of a general transition and fullassignments that satisfy a guard of the selected general transition orthe terminating transition.
In general, at every decision epoch one can use a different decision rule,described by a policy. However, we will only consider so-called stationarypolicies, where the policy uses the same decision rule at every decisionepoch.
A function $\scheduler : \fpath_\Prog \rightarrow (\GT_\Prog \uplus
\{g_\bot\})$ is a history dependent scheduler if for every finite prefix
$f\in\fpath_\Prog$ and configuration $c=(l,t,s) \in \confs_\Prog$,
$\scheduler(fc) = (g, s')$ implies items \ref{itm:md1} to \ref{itm:md4} of
Definition \ref{def:mscheduler} for the last configuration $c$.

The set of all history dependent schedulers for a program $\Prog$ is denoted
by $\HDS^\Prog$, where \enquote{HD} stands for \enquote{history dependent
deterministic}.
Let $\scheduler \in \MDS^\Prog$ be a scheduler and $s_0$ be an initial state.
First, the probability for a program to start at a configuration $c$ is 1 only
for the configuration that has the initial state $s_0$ at the start location
$l_0$, coming from the initial transition $t_\text{in}$. All other
configurations are invalid starting configurations and get assigned a zero
probability by the probability measure $\prSs : \confs_\Prog \rightarrow [0,1]$
By definition only the terminating transition $t_\bot$ is admissible when theprogram is in the terminal location $l_\bot$ and the following configurationmust again be in the terminal location $l_\bot$. A terminating run must end withinfinitely many repetitions of a terminating configuration$c_\bot=(l_\bot,t_\bot,s)$ with some assignment $s\in\Sigma$.
The runtime complexity is a special case of the cost of a run, where the
associated cost is $\kappa_t=1$ for all $t \in \T$. Then
\begin{example}
    Consider the program from Example \ref{ex:prob_sampling} displayed in
    \fref{fig:ex_pip_probs}. It must take at least the transitions $t_1$ and
    $t_3$, hence any runtime less than $2$ is impossible. The variable $x$ is
    decremented by $1$ with a probability of $0.5$ on every visit of
    transition $t_2$. So for a given starting state $s_0$ and $\scheduler \in
    \MDS$, the expected runtime depends on the initial value of $x$. The
    number of visits of $t_2$ needed to decrement $x$ once follows a geometric
    distribution. The expected runtime for decrementing $x$ down to zero ($x$
    times) is
    \begin{equation*}
        \ESs(\Rt(\Prog)) = s_0(x) \cdot \frac{1}{p} = s_0(x) \cdot
        \frac{1}{0.5} = 2s_0(x).
    \end{equation*}
    The expected runtime doesn't depend on the scheduler and is finite for all
    values of $x$, hence the program is \gls{past}.
\end{example}
\begin{definition}[Expected runtime complexity bounds]
    For $s_0\in\Sigma$ and a \gls{pip} $\Prog$, $\RB \in \B$ is an expected
    runtime
% Analogously, $\RB \in \B$ is a cost bound for $s_0$ if% \begin{equation}% \RB \geq \sup \Cost(\Prog) = \sup \ESs(\Rt(\Prog))% \end{equation}
% The tests are chosen to represent a large variety of commonly encountered% real-world programs, but also include known-to-be hard-to-solve problems in% order to challenge the competitors and improve their tools. Their collection of% test programs can be found in the \gls{tpdb} which is publicly% available\footnote{\url{https://github.com/TermCOMP/TPDB}}. During the latests% competition in 2022, eleven candidates lined up in twenty-eight% categories\cite{termcomp2022url}.
\section{Motivation}
\begin{figure}
    \centering
    \begin{subcaptionblock}[t]{0.4\textwidth}
        \centering
        \input{figures/ch1_classic}
        \caption{Classic integer program $\Prog_1$\label{fig:classic}}
    \end{subcaptionblock}
    \begin{subcaptionblock}[t]{0.5\textwidth}
        \centering
        \input{figures/ch1_classic_pe}
        \caption{(UNFINISHED) Partial evaluation of
        $\Prog_1$\label{fig:classic_pe}}
    \end{subcaptionblock}
    \caption{Program whose runtime-complexity bounds are hard to find using
    only \gls{mprf}.\cite{giesl2022arxiv}}
\end{figure}
Consider the program $\Prog_1$ displayed in \fref{fig:classic}. It contains
two program variables $x, y$ and two temporary variables $u,w$, where $u$ is
used to non-deterministically sample $x$ in the first transition $t_0$ and $w$
is used to branch non-deterministically between $t_1$ and $t_2$. The program
clearly terminates, since both loops $t_1$ and $t_2,t_3$ decrement either $x$
or $y$ in every iteration. However, the classical analysis using only
\gls{mprf} fails to find a finite runtime-complexity bound for this
program\cite{giesl2022arxiv}. With the help of \gls{cfr} on a sub-\gls{scc}
level, the program can be transformed into an equivalent program (see
\fref{fig:classic_pe}) where the analysis with \gls{mprf} succeeds at finding
a finite runtime-complexity bound.

The technique used for the transformation is called \gls{cfr} via partial
evaluation. It was first introduced by
\citeauthor{domenech2019arxiv}\cite{domenech2019arxiv} and implemented in
their analysis tool iRankFinder\cite{irankfinder2018wst}. Applied to entire
programs or whole \gls{scc}s, it achieves results very similar to \gls{mprf}.
Its real strength comes from applying it on a sub-\gls{scc} level, refining
specifically the loops where \gls{mprf} fail to find bounds. This approach was
presented by \citeauthor{giesl2022arxiv}\cite{giesl2022lncs,giesl2022arxiv}
and implemented in \gls{koat}\cite{brockschmidt2016acm}, the complexity
analysis tool developed at RWTH Aachen University.
Underneath, \gls{koat} uses iRankFinder for the \gls{cfr}. Recently,
\gls{koat} was extended to probabilistic integer
programs\cite{meyer2021tacas,meyer20arxiv}. Unfortunately, since iRankFinder
is limited to non-probabilistic integer programs, the technique of \gls{cfr}
via partial evaluation remained out of reach for probabilistic programs.

\begin{figure}
    \centering
    \begin{subcaptionblock}[t]{0.4\textwidth}
        \centering
        \input{figures/ch1_prob}
        \caption{Probabilistic integer program $\Prog_2$\label{fig:prob}}
    \end{subcaptionblock}
    \begin{subcaptionblock}[t]{0.5\textwidth}
        \centering
        \input{figures/ch1_prob_pe}
        \caption{Partial evaluation of $\Prog_2$\label{fig:prob_pe}}
    \end{subcaptionblock}
\end{figure}

Consider the very similar probabilistic integer program $\Prog_2$ displayed in
\fref{fig:prob}. The variables $x$ and $y$ are now only decremented with 50\%
probability in every iteration. The program still terminates with probability
one, since a longer runtime gets increasingly unlikely. However, the current
version of \gls{koat} fails to find finite expected runtime-complexity bounds
for this program. It would be desirable to transform $\Prog_2$ into an
equivalent program like the one shown in \fref{fig:prob_pe}, similarly to the
\gls{cfr} technique presented by \citeauthor{giesl2022lncs}\cite{giesl2022lncs}
and \citeauthor{Domenech19}\cite{Domenech19}.

\section{Related works}

\subsection{\acrshort{aprove}, \acrshort{koat}, and \acrshort{loat}}

\Gls{aprove}\cite{giesl2014ijcar} is developed by \citeauthor{giesl2014ijcar}
at RWTH Aachen University. It is capable of analyzing real-world programming
languages like Java, C, Haskell, and Prolog by transforming the given program
into an equivalent \gls{trs} and then analyzing the resulting \gls{trs} with
various techniques and tools. Explaining every technique used in \gls{aprove}
would go beyond the scope of this thesis. It should only be mentioned that
during the analysis, parts of the \gls{trs} can be transformed further into
\gls{its}, which opens the possibility for many more analysis techniques
typically not available for \gls{trs}.

The tools LoAT\cite{frohn2022ijcar} and KoAT\cite{brockschmidt2016acm} are
also developed at RWTH Aachen University and aim at finding lower and upper
runtime-complexity and size bounds on transition systems, respectively. At its
core, KoAT computes bounds for subprograms using \gls{mprf} or \gls{twn}, and
then combines the subprograms to generate upper runtime-complexity and size
bounds for the whole program. Optionally, to improve the analysis, KoAT can
resort to partial evaluation as a control-flow refinement technique on a
sub-\gls{scc} level\cite{giesl2022lncs}. At first, \gls{koat} was aimed at
linear integer programs, but it was recently extended to probabilistic integer
programs\cite{meyer2021tacas} and non-linear arithmetic\todo{citation needed}.