lecture 22

This commit is contained in:
Josia Pietsch 2023-07-04 18:09:52 +02:00
parent e944f90e3a
commit b930b586d1
Signed by: jrpie
GPG key ID: E70B571D66986A2D
3 changed files with 256 additions and 0 deletions

@ -119,3 +119,6 @@ is the unique solution to this problem.
}
Stopping times and optional stopping are very relevant for the exam;
the Markov property is not.
No notes will be allowed in the exam.
Theorems from the lecture as well as
homework exercises might be part of the exam.

inputs/lecture_22.tex Normal file

@ -0,0 +1,251 @@
\lecture{22}{2023-07-04}{Intro Markov Chains II}
\begin{goal}
We want to start with the basics of the theory of Markov chains.
\end{goal}
% \begin{example}[Markov chains with two states]
% Suppose there are two states of a phone line,
% $0$,``free'', or $1$, ``busy''.
% We assume that the state only changes at discrete units of time
% and model this as a sequence of random variables.
% Assume
% \begin{IEEEeqnarray*}{rCl}
% \bP[X_{n+1} = 0 | X_n = 0] &=& p\\
% \bP[X_{n+1} = 1 | X_n = 0] &=& (1-p)\\
% \bP[X_{n+1} = 0 | X_n = 1] &=& q\\
% \bP[X_{n+1} = 1 | X_n = 1] &=& (1-q)
% \end{IEEEeqnarray*}
% for some $p,q \in (0,1)$.
% We can write this as a matrix
% \begin{IEEEeqnarray*}{rCl}
% P &=& \begin{pmatrix}
% p & (1-p) \\
% q & (1-q)
% \end{pmatrix}
% \end{IEEEeqnarray*}
% Note that the rows of this matrix sum up to $1$.
%
% Additionally, we make the following assumption:
% Given that at some time $n$ the phone is in state $i \in \{0,1\}$,
% the behavior of the phone after time $n$ does not depend
% on the way the phone reached state $i$.
%
% \begin{question}
% Suppose $X_0 = 0$.
% What is the probability that the phone is free at times
% $1$ and $2$ and becomes busy at time $3$,
% i.e.~what is $\bP[X_1 = 0, X_2 = 0, X_3 = 1]$?
% \end{question}
% We have
% \begin{IEEEeqnarra*}{rCl}
% \bP[X_1 = 0, X_2 = 0, X_3 = 1]
% &=& \bP[X_3 = 1 | X_2 = 0, X_1 = 0] \bP[X_2 = 0, X_1 = 0]\\
% &=& \bP[X_3 = 1 | X_2 = 0] \bP[X_2 = 0, X_1 = 0]\\
% &=& \bP[X_3 = 1 | X_2 = 0] \bP[X_2 = 0 | X_1 = 0] \bP[X_1 = 0]\\
% &=& P_{0,1} P_{0,0} P_{0,0}
% \end{IEEEeqnarra*}
%
% \begin{question}
% Assume $X_0 = 0$. What is $\bP[X_3 = 1]$?
% \end{question}
% For $\{X_3 = 1\}$ to happen, we need to look at the following
% disjoint events:
% % \begin{IEEEeqnarra*}{rCl}
% % \bP(\{X_3 = 1, X_2 = 0, X_1 = 0\}) &=& P_{0,1} P_{0,0}^2,\\
% % \bP(\{X_3 = 1, X_2 = 0, X_1 = 1\}) &=& P_{0,1}^2 P_{1,0},\\
% % \bP(\{X_3 = 1, X_2 = 1, X_1 = 0\}) &=& P_{0,0} P_{0,1} P_{1,1},\\
% % \bP(\{X_3 = 1, X_2 = 1, X_1 = 1\}) &=& P_{0,1} P_{1,1}^2.
% % \end{IEEEeqnarray*}
%
% More generally, consider a matrix $P \in [0,1]^{n \times n}$
% whose rows sum up to $1$.
% Then we get a Markov chain with $n$ states
% by defining $\bP[X_{n+1} = j | X_{n} = i] = P_{i,j}$.
%
% \end{example}
\begin{definition}
Let $E$ denote a \vocab{discrete state space},
usually $E = \{1,\ldots, N\}$
or $E = \N$ or $E = \Z$.
Let $\alpha$ be a probability measure on $E$.
We say that $(p_{i,j})_{i \in E, j \in E}$ is a
\vocab{transition probability matrix}, if
\[
\forall i,j \in E .~p_{i,j} \ge 0 \land \forall i \in E .~\sum_{j \in E} p_{i,j} = 1.
\]
Given a triplet $(E, \alpha, P)$, we say that a stochastic process $(X_n)_{n \ge 0}$,
i.e.~$X_n: \Omega \to E$, is a \vocab[Markov chain!discrete]%
{Markov chain taking values
on the state space $E$
with initial distribution $\alpha$
and transition probability matrix $P$},
if the following conditions hold:
\begin{enumerate}[(i)]
\item $\bP[X_0 = i] = \alpha(i)$
for all $i \in E$,
\item $\bP[X_{n+1} = i_{n+1} | X_0 = i_0, X_1 = i_1, \ldots, X_{n} = i_{n}]
= \bP[X_{n+1} = i_{n+1} | X_n = i_n] = p_{i_n, i_{n+1}}$
for all $n \ge 0$ and $i_0,\ldots, i_{n+1} \in E$
(provided $\bP[X_0 = i_0, X_1 = i_1, \ldots, X_n = i_n] \neq 0$).
\end{enumerate}
\end{definition}
\begin{fact}
For all $n \in \N_0$ and $i_0,\ldots,i_n \in E$, we have
\[
\bP[X_0 = i_0, X_1 = i_1, \ldots, X_n = i_n] =
\alpha(i_0) \cdot p_{i_0,i_1} \cdot p_{i_1,i_2} \cdot \ldots \cdot p_{i_{n-1}, i_n}.
\]
\end{fact}
\begin{fact}
For all $n \in \N$, $i_n \in E$, we have
\[
\bP[X_n = i_n] = \sum_{i_0, \ldots, i_{n-1} \in E} \alpha(i_0) p_{i_0,i_1} \cdot \ldots \cdot p_{i_{n-1}, i_n}.
\]
\end{fact}
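To illustrate both facts in the simplest non-trivial case,
here is a quick two-state computation:
\begin{example}
Take $E = \{0,1\}$, $\alpha = \delta_0$ and
\[
P = \begin{pmatrix}
p & 1-p \\
q & 1-q
\end{pmatrix}
\]
for some $p,q \in (0,1)$.
Then the second fact gives
\[
\bP[X_2 = 0] = \sum_{i_1 \in \{0,1\}} \alpha(0) p_{0,i_1} p_{i_1,0}
= p^2 + (1-p) q,
\]
which is the $(0,0)$-entry of $P^2$.
In general, viewing $\alpha$ as a row vector,
the second fact says exactly that $\bP[X_n = i_n] = (\alpha P^n)_{i_n}$.
\end{example}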
\begin{example}[Simple random walk on $\Z$]
Let $E \coloneqq \Z$, $(\xi_n)_n$ i.i.d.~with $\bP[\xi_i = 1] = \bP[\xi_i = -1] = \frac{1}{2}$.
Let $X_0 = 0, X_n = \xi_1 + \ldots + \xi_n$.
Let $\alpha = \delta_0 \in M_1(\Z)$.
Consider
\begin{IEEEeqnarray*}{rCl}
P &=&
\begin{pmatrix}
\ddots & \ddots & \ddots & & \\
\frac{1}{2} & 0 & \frac{1}{2} & & \\
& \frac{1}{2} & 0 & \frac{1}{2} & \\
& & \frac{1}{2} & 0 & \frac{1}{2} \\
& & & \ddots & \ddots
\end{pmatrix},
\end{IEEEeqnarray*}
i.e.~$p_{i,j} = \frac{1}{2}$ if $|i - j| = 1$
and $p_{i,j} = 0$ otherwise.
\end{example}
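In this example the $n$-step distribution is explicit:
$\frac{n + X_n}{2}$ counts the number of $+1$ steps among
$\xi_1,\ldots,\xi_n$ and is therefore binomially distributed,
so
\[
\bP[X_n = k] = \binom{n}{\frac{n+k}{2}} 2^{-n}
\]
whenever $|k| \le n$ and $n + k$ is even,
and $\bP[X_n = k] = 0$ otherwise.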
% \begin{example}
% Consider a game where a player wins or loses $1$ per round.
% Let $p$ be the probability of winning.
% The player plays until they lose all their money.
% Let $X_n$ be the capital of the gambler at time $n$.
% Define a matrix $P$
% by $P_{0,0} = 1$, $P_{i,i+1} = p$ and $P_{i,i-1} = (1-p)$ for $i \ge 1$,
% and all other entries $0$.
% \end{example}
\begin{definition}
Let $E$ be a complete, separable metric space,
$\alpha \in M_1(E)$.
For every $x \in E$,
let $\mathbf{P}(x, \cdot )$ be a probability measure on $E$.%
\footnote{$\mathbf{P}(x,\cdot )$ corresponds to a row of our matrix in the discrete case.}
Given the triple $(E, \alpha, \{\mathbf{P}(x, \cdot )\}_{x \in E})$,
we say that a stochastic process $(X_n)_{n \ge 0}$
is a \vocab[Markov chain]{Markov chain taking values on $E$ %
with starting distribution $\alpha$ %
and transition probability $\{\mathbf{P}(x, \cdot )\}_{x \in E}$}
if
\begin{enumerate}[(i)]
\item $\bP[X_0 \in \cdot ] = \alpha(\cdot )$,
\item For all bounded, measurable $f: E \to \R$,
\[
\bE[f(X_{n+1}) | \cF_n] = \bE[f(X_{n+1}) | X_n]
= \int_E f(y) \mathbf{P}(X_n, \dif y) \text{ a.s.}
\]
\end{enumerate}
\end{definition}
\begin{remark}
This agrees with the definition in the discrete case:
every bounded, measurable $f: E\to \R$ can be approximated
by simple functions,
so (ii) from the discrete case implies (ii) from the general definition.
\end{remark}
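A standard example of a transition probability on a
non-discrete state space is the Gaussian kernel:
\begin{example}
Let $E = \R$ and
\[
\mathbf{P}(x, A) \coloneqq \int_A \frac{1}{\sqrt{2 \pi}} e^{-\frac{(y-x)^2}{2}} \dif y.
\]
If $(\xi_n)_n$ are i.i.d.~standard normal random variables
and $X_{n+1} \coloneqq X_n + \xi_{n+1}$,
then $(X_n)_{n \ge 0}$ is a Markov chain with this
transition probability,
a random walk with Gaussian increments.
\end{example}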
\begin{notation}
If $\{\mathbf{P}(x, \cdot )\}_{x \in E}$ is a transition probability,
define the operator $\mathbf{P} : \cB_{\text{bdd}}(E) \to \cB_{\text{bdd}}(E)$
by
\[
(\mathbf{P} f)(x) \coloneqq \int_E f(y) \mathbf{P}(x, \dif y)
\]
for all bounded, measurable $f: E \to \R$.
\end{notation}
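In the discrete case this is simply the transition matrix
acting on the column vector $(f(j))_{j \in E}$, i.e.
\[
(\mathbf{P}f)(i) = \sum_{j \in E} p_{i,j} f(j) = \bE[f(X_{n+1}) | X_n = i].
\]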
We get the following fundamental link between martingales and Markov chains:
\begin{theorem}
\label{martingalesandmarkovchains}
Suppose $(E, \alpha, \{\mathbf{P}(x, \cdot )\}_{x \in E})$
is given.
Then a stochastic process $(X_n)_{n \ge 0}$ is a Markov chain
iff for every $f: E \to \R$ bounded, measurable,
\[
M_n(f) \coloneqq f(X_n) - f(X_0) + \sum_{j=0}^{n-1} (\mathbf{I} - \mathbf{P})f(X_j)
\]
is a martingale
with respect to the canonical filtration of $(X_n)$.
\end{theorem}
\begin{proof}
$\implies$
Fix some bounded, measurable $f : E \to \R$.
Then, for all $n$, $M_n(f)$ is bounded
and hence $M_n(f) \in L^1$.
$M_n(f)$ is $\cF_n$-measurable for all $n \in \N$.
\begin{claim}
$\bE[M_{n+1}(f) | \cF_n] = M_n(f)$.
\end{claim}
\begin{subproof}
It suffices to show
$\bE[M_{n+1}(f) - M_n(f) | \cF_n] = 0$ a.s.
We have
\begin{IEEEeqnarray*}{rCl}
\bE[M_{n+1}(f) - M_n(f) | \cF_n]
&=& \bE[f(X_{n+1}) | \cF_n] - (\mathbf{P}f)(X_n)\\
&\overset{\text{Markov property}}{=}& (\mathbf{P}f)(X_n) - (\mathbf{P}f)(X_n)\\
&=& 0.
\end{IEEEeqnarray*}
\end{subproof}
$\impliedby$
Suppose $(M_n(f))_n$ is a martingale for all bounded, measurable $f$.
By the martingale property, we have
\begin{IEEEeqnarray*}{rCl}
\bE[f(X_{n+1}) | \cF_n]
&=& (\mathbf{P}f)(X_n)\\
&=& \int f(y) \mathbf{P}(X_n, \dif y).
\end{IEEEeqnarray*}
Since the right-hand side is $\sigma(X_n)$-measurable,
the tower property yields
$\bE[f(X_{n+1}) | X_n] = (\mathbf{P}f)(X_n)$ as well.
This proves (ii).
\end{proof}
\begin{definition}
Given $\{\mathbf{P}(x, \cdot )\}_{x \in E}$,
we say that $f: E \to \R$ is \vocab{harmonic},
iff $f(x) = (\mathbf{P}f)(x)$
for all $x \in E$.
We call $f$ \vocab{super-harmonic},
if $(\mathbf{I} - \mathbf{P}) f \ge 0$
and \vocab{sub-harmonic},
if $(\mathbf{I} - \mathbf{P}) f \le 0$.
\end{definition}
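For the simple random walk on $\Z$ this is easy to check explicitly:
\begin{example}
The function $f(x) = x$ is harmonic, since
\[
(\mathbf{P}f)(x) = \frac{1}{2}(x+1) + \frac{1}{2}(x-1) = x,
\]
while $f(x) = x^2$ is sub-harmonic, since
\[
(\mathbf{P}f)(x) = \frac{1}{2}(x+1)^2 + \frac{1}{2}(x-1)^2 = x^2 + 1 \ge x^2.
\]
(These $f$ are unbounded, so the identities are to be read pointwise.)
\end{example}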
\begin{corollary}
If $f$ is (sub-/super-)harmonic, then for every triple
$(E, \alpha, \{\mathbf{P}(x, \cdot )\}_{x \in E})$
and every corresponding Markov chain $(X_n)_{n \ge 0}$,
$f(X_n)$ is a (sub-/super-)martingale.
\end{corollary}
\begin{question}
Given a set $A \subseteq E$ and a function $f$ defined on $A$,
find a function $u: E \to \R$ such that $u$ is harmonic
on $E \setminus A$ and $u = f$ on $A$.
\end{question}
Let $u(x) \coloneqq \bE_x[f(X_{T_A})]$,
where $\bE_x$ denotes expectation for the Markov chain
started at $x$,
and $T_A \coloneqq \inf \{n \ge 0 : X_n \in A\}$
is the hitting time of $A$.
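The classical instance of this is the symmetric gambler's ruin:
\begin{example}
For the simple random walk on $\Z$ and some $N \in \N$,
let $A \coloneqq \{0, N\}$, $f(0) \coloneqq 0$ and $f(N) \coloneqq 1$.
For $0 \le x \le N$, the function
$u(x) = \bE_x[f(X_{T_A})] = \bP_x[X_{T_A} = N]$
satisfies $u(0) = 0$, $u(N) = 1$ and
\[
u(x) = \frac{1}{2} u(x-1) + \frac{1}{2} u(x+1), \qquad 0 < x < N,
\]
whose unique solution is $u(x) = \frac{x}{N}$,
the probability of hitting $N$ before $0$ when starting from $x$.
\end{example}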


@ -46,6 +46,8 @@
\input{inputs/lecture_20.tex}
\input{inputs/lecture_21.tex}
\input{inputs/lecture_22.tex}
\cleardoublepage
%\backmatter