CoCalc -- main.tex

📚 The CoCalc Library - books, templates and other resources
cocalc-examples / martinthoma-latex-examples / presentations / causality-presentation / backup / main.tex
²⁰¹⁹⁶⁶ views
License: OTHER
1
%!TEX root = interventions.tex
2
\section{Interventions}
3
\subsection{Definition}
4
\begin{frame}{Interventionen}
5
    \begin{block}{Interventionsverteilung}
6
        Sei $\mathbb{P}^\mathbf{X}$ die zu einem SEM
7
        $\mathcal{S} := (\mathcal{S}, \mathbb{P}^N)$ gehörende Verteilung. \onslide<2->{Dann
8
                können eine (oder mehrere) Strukturgleichungen aus $\mathcal{S}$ ersetzt
9
                werden, ohne einen Zyklus im Graphen zu erzeugen.} \onslide<3->{Die Verteilung des
10
        neuen SEM $\tilde{\mathcal{S}}$ heißt dann
11
        \textit{Interventionsverteilung}.}
12

13
        \onslide<4->{Bei den Variablen, deren Strukturgleichungen ersetzt wurden, sagt man,
14
        wurde \textit{interveniert}.}
15

16
        \onslide<5->{Die neue Verteilung wird mit
17
        \[\mathbb{P}_{\tilde{\mathcal{S}}}^{\mathbf{X}} = \mathbb{P}_{\mathcal{S}, do(X_j:=\tilde{f}(\tilde{\mathbf{PA}}_j, \tilde{N}_j))}^{\mathbf{X}}\]
18
        beschrieben.}
19

20
        \onslide<6->{Die Menge der Rauschvariablen in $\tilde{\mathcal{S}}$ beinhaltet nun einige
21
        \enquote{neue} und einige \enquote{alte} $N$'s. Diese Menge muss
22
        gemeinsam unabhängig sein.}
23
    \end{block}
24
\end{frame}
25

26
\begin{frame}{Nieren-Beispiel}
27
    \begin{table}
28
        \begin{tabular}{lrr}
29
        \toprule
30
        ~      & \multicolumn{2}{c}{\textbf{Behandlungserfolg}}  \\
31
        \cmidrule{2-3}
32
        ~                   & \multicolumn{1}{c}{\textbf{A}} & \multicolumn{1}{c}{\textbf{B}} \\ \midrule
33
        Kleine Nierensteine & \textbf{93\%} & 87\% \\
34
        Große Nierensteine  & \textbf{73\%} & 69\% \\
35
        \textbf{Gesamt}     &          78\% & \textbf{83\%} \\
36
        \bottomrule
37
        \end{tabular}
38
    \end{table}
39

40
    \begin{figure}[!h]
41
        \centering
42
        \begin{tikzpicture}[->,>=stealth',shorten >=1pt,auto,node distance=2.5cm,
43
      thick,main node/.style={circle,fill=blue!10,draw,font=\sffamily\Large\bfseries}]
44
          \node (Z) at (1,1) {Z};
45
          \node (T) at (0,0) {T};
46
          \node (R) at (2,0) {R};
47

48
          \foreach \from/\to in {Z/T,Z/R,T/R}
49
            \draw (\from) -> (\to);
50
        \end{tikzpicture}
51
    \end{figure}
52

53
    \begin{align*}
54
        Z &= N_Z, \;\;\;& N_Z &\sim Ber(\nicefrac{1}{4})\\
55
        T &= \lfloor 2 \cdot (1-Z+N_T) \rfloor \;\;\; & N_T &\sim \mathcal{N}(0, 1)\\
56
        R &= \lfloor 2 \cdot (0.6 \cdot (1-Z) + 0.4 \cdot (1-T) + N_R) \rfloor  \;\;\; & N_R &\sim \mathcal{N}(0, 1)
57
    \end{align*}
58
\end{frame}
59

60
% \begin{frame}{Interventionen: Spezialfälle}
61
%     \begin{block}{Interventionsverteilung}
62
%         Wenn $\tilde{f}(\tilde{\mathbf{PA}_j}, \tilde{N}_j)$ eine Punktmasse
63
%         auf ein $a \in \mathbb{R}$ legt schreibt man
64
%         \[\mathbb{P}_\mathcal{S, do(X_j := \tilde{f}(\tilde{\mathbf{PA}_j}, \tilde{N}_j))}^{\mathbf{X}}\]
65
%         und nennt die Intervention
66
%         \textbf{perfekt}.\\
67

68
%         Eine Intervention mit $\tilde{\mathbf{PA}_j} = \mathbf{PA}_j$ wird
69
%         \textbf{mangelhaft} genannt.
70
%     \end{block}
71
% \end{frame}
72

73
\begin{frame}[t]{Beispiel 2.2.2: Ursache und Effekt}
74
    Es sei $\mathcal{S}$ gegeben durch
75
    \begin{align}
76
        X &= N_X\\
77
        Y &= 4 \cdot X + N_Y
78
    \end{align}
79
    mit $N_X, N_Y \overset{\text{iid}}{\sim} \mathcal{N}(0, 1)$ und dem
80
    Graphen $X \rightarrow Y$.
81
    \only<2-9>{
82
        Dann gilt:
83
        \begin{align}
84
            \mathbb{P}_\mathcal{S}^Y = \mathcal{N}(0, 4^2 + 1) &\onslide<3->{\neq \mathcal{N}(8, 1)} \onslide<4->{= \mathbb{P}_{\mathcal{S}, do(X:=2)}^{Y}} \onslide<5->{= \mathbb{P}_\mathcal{S}^{Y|X=2}}\\
85
            &\onslide<6->{\neq \mathcal{N}(12, 1)} \onslide<7->{= \mathbb{P}_{\mathcal{S}, do(X:=3)}^{Y}} \onslide<8->{= \mathbb{P}_\mathcal{S}^{Y|X=3}}
86
        \end{align}
87
        \onslide<9->{$\Rightarrow$ Intervention auf $X$ beeinflusst die Verteilung von $Y$.}
88
    }
89
    \only<10-13>{
90
        Aber:
91

92
        \begin{align}
93
            \mathbb{P}_{\mathcal{S}, do(Y:=2)}^{X} &= \mathcal{N}(0, 1)\\
94
            \onslide<11->{&= \mathbb{P}_\mathcal{S}^X}\\
95
            \onslide<12->{&= \mathbb{P}_{\mathcal{S}, do(Y:=3.14159)}^{X}}\\
96
            \onslide<13->{&\neq \mathbb{P}_\mathcal{S}^{X|Y=2}}
97
        \end{align}
98
    }
99
    \only<14->{\\
100
        Beispiel: $X$ (rauchen) $\rightarrow Y$ (weiße Zähne)
101
        \begin{itemize}
102
            \item<15-> Es besteht eine Asymmetrie zwischen Ursache ($X$) und Effekt ($Y$).
103
            \item<16-> $\mathbb{P}_{\mathcal{S}, do(Y:=\tilde{N}_Y)}^{X,Y} \Rightarrow X \perp\!\!\!\perp Y$
104
            \item<17-> $\mathbb{P}_{\mathcal{S}, do(X:=\tilde{N}_X)}^{X,Y} \text{ und } Var(\tilde{N}_X) > 0 \Rightarrow X \not\perp\!\!\!\perp Y$
105
        \end{itemize}
106
    }
107
\end{frame}
108

109
\section{Totaler kausaler Effekt}
110
\subsection{Totaler kausaler Effekt}
111
\begin{frame}{Totaler kausaler Effekt}
112
    \begin{block}{Totaler kausaler Effekt}
113
        Gegeben sei ein SEM $\mathcal{S}$. Dann gibt es einen
114
        (totalen) kausalen Effekt von $X$ nach $Y$ genau dann, wenn
115
        \[\exists \tilde{N}_X : X \not\!\perp\!\!\!\perp Y \text{ in } \mathbb{P}_{\mathcal{S}, do(X:=\tilde{N}_X)}^{\mathbf{X}}\]
116
        gilt.
117
    \end{block}
118
\end{frame}
119

120
\begin{frame}[t]{Totaler kausaler Effekt: Äquivalenzen}
121
    Folgende Aussagen sind äquivalent:
122

123
    \begin{enumerate}[label=(\roman*)]
124
        \item $\exists \tilde{N}_{X_1} \hphantom{\text{ mit vollem Support }}: X_1 \not\!\perp\!\!\!\perp X_2 \text{ in } \mathbb{P}_{\mathcal{S}, do(X_1:=\tilde{N}_{X_1})}^{\mathbf{X}}$
125
        \item $\exists x^\triangle \exists x^\square: \mathbb{P}_{\mathcal{S}, do(X_1:=x^\triangle)}^{X_2} \neq \mathbb{P}_{\mathcal{S}, do(X_1:=x^\square)}^{X_2}$
126
        \item $\exists x^\triangle \hphantom{\exists x^\square}: \mathbb{P}_{\mathcal{S}, do(X_1:=x^\triangle)}^{X_2} \neq \mathbb{P}_\mathcal{S}^{X_2}$.
127
        \item $\forall \tilde{N}_{X_1} \text{ mit vollem Support }: X_1 \not\!\perp\!\!\!\perp X_2 \text{ in } \mathbb{P}_{\mathcal{S}, do(X_1:=\tilde{N}_{X_1})}^{\mathbf{X}}$
128
    \end{enumerate}
129

130
    \only<2>{
131
    \textbf{Beweisplan:}\\
132
    (i) $\Rightarrow$ (ii) $\Rightarrow$ (iv) $\Rightarrow$ (i)\\
133
    $\neg$(i) $\Rightarrow$ $\neg$ (iii) äquivalent zu (iii) $\Rightarrow$ (i)\\
134
    (ii) $\Rightarrow$ (iii)
135
    }
136
    \only<3-5>{
137
        \begin{align}
138
            p_{\mathcal{S}, do(X_1:=x_1)}^{X_2}(x_2) &= \int \prod_{j \neq 1} p_j(x_j|x_{pa(j)}) \mathrm{d}x_3 \dots \mathrm{d}x_p \nonumber
139
            \only<4->{\\&= \int \prod_{j \neq 1} p_j(x_j|x_{pa(j)}) \frac{\tilde{p}(x_1)}{\tilde{p}(x_1)}\mathrm{d}x_3 \dots \mathrm{d}x_p \nonumber}
140
            \only<5->{\\&= p_{\mathcal{S}, do(X_1:=\tilde{N}_1)}^{X_2 | X_1=x_1}(x_2)\tag{A.1}\label{eq:A.1}}
141
        \end{align}
142
        \only<5->{mit $\tilde{p}(x_1) > 0$.}
143
    }
144
    \only<6>{
145
        \begin{align}
146
            X_2 \not\perp\!\!\!\perp X_1 \text{ in } \mathbb{Q} \Leftrightarrow &\exists x_1^\triangle, x_1^\square \nonumber\\
147
            &\text{mit } q(x_1^\triangle), q(x_1^\square) > 0\nonumber\\
148
            &\text{und } \mathbb{Q}^{X_2|X_1=x_1^\triangle} \neq \mathbb{Q}^{X_2 | X_1=x_1^\square}\tag{A.2}\label{eq:A.2}
149
        \end{align}
150
    }
151

152
    \only<7>{
153
        \begin{align}
154
            X_2 \not\perp\!\!\!\perp X_1 \text{ in } \mathbb{Q} \Leftrightarrow &\exists x_1^\triangle \nonumber\\
155
            &\text{mit } q(x_1^\triangle) > 0\nonumber\\
156
            &\text{und } \mathbb{Q}^{X_2|X_1=x_1^\triangle} \neq \mathbb{Q}^{X_2}\tag{A.3}\label{eq:A.3}
157
        \end{align}
158
    }
159

160
    \only<8-10>{
161
        \textbf{Beweisplan:} (i) $\Rightarrow$ (ii)\\
162
        \onslide<9->{(i) $\overset{A.2}{\Rightarrow} \exists x_1^\triangle, x_1^\square$ mit
163
        pos. Dichte unter $\tilde{N_1}$ sodass $\mathbb{P}_{\mathcal{S}, do(X_1:=\tilde{N_1})}^{X_2|X_1=x_1^\triangle} \neq \mathbb{P}_{\mathcal{S}, do(X_1:=\tilde{N_1})}^{X_2 | X_1=x_1^\square}$\\}
164
        \onslide<10->{$\overset{A.1}{\Rightarrow} (ii)$}
165
    }
166
    \only<11-13>{
167
        \textbf{Beweisplan:} (ii) $\Rightarrow$ (iv)\\
168
        \onslide<12->{(ii) $\overset{A.1}{\Rightarrow} \exists x_1^\triangle, x_1^\square$ mit pos. Dichte unter $\hat{N_1}$ sodass $\mathbb{P}_{\mathcal{S}, do(X_1:=\hat{N_1})}^{X_2|X_1=x_1^\triangle} \neq \mathbb{P}_{\mathcal{S}, do(X_1 := \hat{N_1})}^{X_2 | X_1 = x_1^\square}$}
169
        \onslide<13->{$\overset{A.2}{\Rightarrow} (iv)$}
170
    }
171
    \only<14>{
172
        \textbf{Beweisplan:} (iv) $\Rightarrow$ (i)\\
173
        Trivial
174
    }
175
    \only<15-17>{
176
        \textbf{Beweisplan:} $\neg$(i) $\Rightarrow$ $\neg$ (iii)\\
177
        \onslide<16->{Es gilt: $\mathbb{P}_\mathcal{S}^{X_2} = \mathbb{P}_{\mathcal{S}, do(X_1 := N_1^*)}^{X_2}$, wobei $N_1^*$ wie $\mathbb{P}_\mathcal{S}^{X_1}$ verteilt ist.\\}
178
        \onslide<17->{
179
            \begin{align}
180
                \neg (i) &\Rightarrow X_2 \perp\!\!\!\perp X_1 \text{ in } \mathbb{P}_{\mathcal{S}, do(X_1 := N_1^*)}^{\mathbf{X}}\\
181
                &\overset{A.3}{\Rightarrow} \mathbb{P}_{\mathcal{S}, do(X_1 :=N_1^*)}^{X_2| X_1=x^\triangle} = \mathbb{P}_{\mathcal{S}, do(X_1 := N_1^*)}^{X_2} \;\;\;\forall x^\triangle \text{ mit } p_1(x^\triangle) > 0\\
182
                &\overset{A.1}{\Rightarrow} \mathbb{P}_{\mathcal{S}, do(X_1:=x^\triangle)}^{X_2} = \mathbb{P}_\mathcal{S}^{X_2} \;\;\; \forall x^\triangle \text{ mit } p_1(x^\triangle) > 0\\
183
                &\overset{\neg (ii)}{\Rightarrow} \neg (iii)
184
            \end{align}
185
        }
186
    }
187
    \only<18>{
188
        \textbf{Beweisplan:} (ii) $\Rightarrow$ (iii)\\
189
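        Aus $\mathbb{P}_{\mathcal{S}, do(X_1:=x^\triangle)}^{X_2} \neq \mathbb{P}_{\mathcal{S}, do(X_1:=x^\square)}^{X_2}$ folgt, dass mindestens eine der beiden Verteilungen von $\mathbb{P}_\mathcal{S}^{X_2}$ verschieden ist.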
190
    }
191
\end{frame}
192

193
\begin{frame}{Beispiel 2.2.6: Randomisierte Studie}
194
    \begin{itemize}
195
        \item<1-> Weise eine Behandlung $T$ zufällig (nach $\tilde{N_T}$) einem
196
              Patienten zu. Das könnte auch ein Placebo sein.
197
        \item<2-> Im SEM: Daten aus $\mathbb{P}_{\mathcal{S}, do(T:=\tilde{N_T})}^{\mathbf{X}}$
198
        \item<3-> Falls immer noch Abhängigkeit zw. Behandlung und Erfolg
199
              vorliegt $\Rightarrow T$ hat einen totalen kausalen Effekt auf
200
              den Behandlungserfolg.
201
    \end{itemize}
202
\end{frame}
203

204
\begin{frame}{Beispiel 2.2.7: Nicolais Running-and-Health-Beispiel}
205
    Das zugrundeliegende (\enquote{wahre}) SEM $\mathcal{S}$, welches die Daten
206
    generierte, hat die Form:
207

208
    \begin{align}
209
        A &= N_A            &&\text{mit } N_A \sim Ber(\nicefrac{1}{2})\\
210
        H &= A + N_H \mod 2 &&\text{mit } N_H \sim Ber(\nicefrac{1}{3})\\
211
        B &= H + N_B \mod 2 &&\text{mit } N_B \sim Ber(\nicefrac{1}{20})
212
    \end{align}
213

214
    mit dem Graphen $A \rightarrow H \rightarrow B$ und\\
215
    $N_A, N_H, N_B$ unabhängig.
216

217
    \begin{itemize}
218
        \item<1->  $B$ ist hilfreicher für die Vorhersage von $H$ als $A$.
219
        \item<2->  Eine Intervention auf $A$ hat einen größeren Einfluss auf $H$ als eine Intervention auf $B$.
220
    \end{itemize}
221
\end{frame}
222

223
\begin{frame}{Proposition 2.2.9}
224
    \begin{enumerate}[label=(\roman*)]
225
        \item<1-> Falls es keinen gerichteten Pfad von $X$ nach $Y$ gibt, dann
226
                  gibt es keinen kausalen Effekt.
227
        \item<2-> Manchmal gibt es einen gerichteten Pfad, aber keinen kausalen
228
                  Effekt.
229
    \end{enumerate}
230

231
    \onslide<3->{Beweis von (i): Folgt aus der Markov-Eigenschaft des
232
                 intervenierten SEMs. }\onslide<4->{Nach dem Entfernen der
233
                 in $X$ eingehenden Kanten gilt: $X$ und $Y$ sind
234
                 $d$-separiert, falls es keinen gerichteten Pfad von $X$ nach
235
                 $Y$ gibt. \\}
236
    \onslide<5->{Beweis von (ii) durch Gegenbeispiel: Sei
237
    \begin{align}
238
        X &= N_X\\
239
        Z &= 2X + N_Z\\
240
        Y &= 4X - 2Z + N_Y
241
    \end{align}
242
    Dann gilt: $Y = - 2N_Z + N_Y$ und daher $X \perp\!\!\!\perp Y$ für alle $N_X$. $\square$
243
    }
244
\end{frame}
245

246
% \begin{frame}{Nierensteine}
247
% \begin{columns}
248
%     \begin{column}{0.45\textwidth}
249
%         \begin{center}\textbf{Modell A}\end{center}
250
%     \end{column}
251
%     \begin{column}{0.45\textwidth}
252
%         \begin{center}\textbf{Modell B}\end{center}
253
%     \end{column}
254
% \end{columns}
255
% \end{frame}
256
Product

Resources

Company