Changeset - 0f7c68754475
[Not reviewed]
0 1 0
Andras Gilyen - 8 years ago 2017-09-07 19:06:22
gilyen@clayoquot.swat.cwi.nl
nicer proof
1 file changed with 4 insertions and 4 deletions:
0 comments (0 inline, 0 general)
main.tex
Show inline comments
 
@@ -399,101 +399,101 @@ and indeed the sums agree up to order $p^{k-1}=p^2$. When going up to order $p^{
 
Ideally we would now like to sum this expression over all possible paths $\xi_1,\xi_2$ and use $p_\mathrm{tot}:=\sum_{\xi\in\paths{b_i}} \mathbb{P}[\xi] = 1$ (which also holds up to arbitrary order in $p$). The above expression would then become $R_{b_1} + R_{b_2}$. However, not all paths in the sum would satisfy the independence condition so it seems we can't do this. We now argue that it works up to order $p^{k-1}$.
 
For all $\xi\in\paths{b_1\land b_2}$ we have that \emph{either} $\xi$ splits into two independent paths $\xi_1,\xi_2$ as above, \emph{or} it does not. In the latter case, when $\xi$ can not be split like that, we know $\mathbb{P}[\xi]$ contains a power $p^k$ or higher because there is a gap of size $k$  and the paths must have moved at least $k$ times `towards each other' (for example one path moves $m$ times to the right and the other path moves $k-m$ times to the left). So the total weight of such a combined path is at least order $p^k$. Therefore we have
 
\[
 
	R_{b_1\land b_2} = \sum_{\mathclap{\substack{\xi_{1,2}\in\paths{b_{1,2}}\\ \mathrm{independent}}}} \mathbb{P}[\xi_2]\mathbb{P}[\xi_1]|\xi_1| + \sum_{\mathclap{\substack{\xi_{1,2}\in\paths{b_{1,2}}\\ \mathrm{independent}}}} \mathbb{P}[\xi_1]\mathbb{P}[\xi_2]|\xi_2| + \sum_{\mathclap{\xi\;\mathrm{dependent}}} \mathbb{P}[\xi]|\xi|.
 
\]
 
where last sum only contains only terms of order $p^{k}$ or higher. Now for the first sum, note that
 
\[
 
	\sum_{\mathclap{\substack{\xi_{1,2}\in\paths{b_{1,2}}\\ \mathrm{independent}}}} \mathbb{P}[\xi_2]\mathbb{P}[\xi_1]|\xi_1|
 
    = \sum_{\xi_1\in\paths{b_1}} \sum_{\substack{\xi_2\in\paths{b_2}\\ \text{independent of }\xi_1}} \mathbb{P}[\xi_2]\mathbb{P}[\xi_1]|\xi_1|
 
\]
 
where the sum over independent paths could be empty for certain $\xi_1$. Now we replace this last sum by a sum over \emph{all} paths $\xi_2\in\paths{b_2}$. This will change the sum but only for terms where $\xi_1,\xi_2$ are dependent. For those terms we already know that $\mathbb{P}[\xi_1]\mathbb{P}[\xi_2]$ contains a factor $p^k$ and hence we have 
 
\begin{align*}
 
    \sum_{\mathclap{\substack{\xi_{1,2}\in\paths{b_{1,2}}\\ \mathrm{independent}}}} \mathbb{P}[\xi_2]\mathbb{P}[\xi_1]|\xi_1|
 
    &= \sum_{\xi_1\in\paths{b_1}} \sum_{\xi_2\in\paths{b_2}} \mathbb{P}[\xi_2]\mathbb{P}[\xi_1]|\xi_1| + \mathcal{O}(p^k) \\
 
    &= \sum_{\xi_1\in\paths{b_1}} \mathbb{P}[\xi_1]|\xi_1| + \mathcal{O}(p^k) \\
 
    &= R_{b_1} + \mathcal{O}(p^k)
 
\end{align*}
 
we can do the same with the second term and this proves the claim.
 
\end{proof}
 

	
 
~\\
 
\textbf{Proof of claim \ref{claim:weakcancel}}: We can assume $C$ consists of a group on the left with $l$ slots and a group on the right with $r$ slots (so $r+l=|C|$), with a gap of size $k=\mathrm{gap}(C)$ between these groups. Then on the left we have strings in $\{0,1'\}^l$ as possibilities and on the right we have strings in $\{0,1'\}^r$. The combined configuration can be described by strings $f=(a,b)\in\{0,1'\}^{l+r}$. The initial probability of such a state $C(a,b)$ is $\rho_{C(a,b)} = (-1)^{|a|+|b|} p^{r+l}$ and by claim \ref{claim:expectationsum} we know $R_{C(a,b)} = R_{C(a)} + R_{C(b)} + \mathcal{O}(p^k)$ where $C(a)$ indicates that only the left slots have been filled by $a$ and the other slots are filled with $1$s. The total contribution of these configurations is therefore
 
\begin{align*}
 
    \sum_{f\in\{0,1'\}^{|C|}} \rho_{C(f)} R_{C(f)}
 
    &= \sum_{a\in\{0,1'\}^l} \sum_{b\in\{0,1'\}^r} (-1)^{|a|+|b|}p^{r+l} \left( R_{C(a)} + R_{C(b)} + \mathcal{O}(p^k) \right) \\
 
    &=\;\;\; p^{r+l}\sum_{a\in\{0,1'\}^l} (-1)^{|a|} R_{C(a)} \sum_{b\in\{0,1'\}^r} (-1)^{|b|} \\
 
    &\quad + p^{r+l}\sum_{b\in\{0,1'\}^r} (-1)^{|b|} R_{C(b)} \sum_{a\in\{0,1'\}^l} (-1)^{|a|}
 
        + \mathcal{O}(p^{r+l+k})\\
 
    &= 0 + \mathcal{O}(p^{|C|+k})
 
\end{align*}
 
where we used the identity $\sum_{a\in\{0,1\}^l} (-1)^{|a|} = 0$.
 

	
 
\newpage
 
\section{Proving the strong cancellation claim}
 
It is useful to introduce some new notation. We will consider variations of the Markov Chains:
 
\begin{itemize}
 
    \item $\P^{(n)}$ refers to the original process on the length-$n$ cycle.
 
    \item $\P^{[a,b]}$ or $\P^{[n]}$ refers to a similar Markov Chain but on a finite chain ($[a,b]$ or $[1,n]$).
 
\end{itemize}
 
The process on the finite chain has the following modification at the boundary: if a boundary site is resampled, it can not resample one of its neighbors so it ignores it and only draws two new bits.
 

	
 
%Note that an \emph{event} is a subset of all possible paths of the Markov Chain.
 
\begin{definition}[Events conditioned on starting state] \label{def:conditionedevents}
 
    For any state $b\in\{0,1\}^n$, define $\start{b}$ as the event that the starting state of the chain is the state $b$. For any event $A$, define
 
    \begin{align*}
 
        \P^{(n)}_b(A) &= \P^{(n)}(A \;|\; \start{b}) %\\
 
        %R_{b,A} &= \mathbb{E}( \#resamples \;|\; A \; , \; \start{b})
 
    \end{align*}
 
    Furthermore, for the Markov Chain on the finite chain, define
 
    Furthermore, for $v\in[n]$ we define
 
    \begin{align*}
 
        \P^{[n]}_{\partial=1}(A) &= \P^{[n]}(A \;|\; \text{boundary is initialized to }1)
 
        \P^{[n]}_{b_v=1}(A) &= \P^{[n]}(A \;|\; v\text{ is initialized to }1),
 
    \end{align*}
 
    where the boundary of $[n]$ is site $1$ and site $n$, and the boundary of $[a,b]$ are $a$ and $b$.
 
    and we define similarly $\P^{[n]}_{b_v=b_w=1}(A)$ for $v,w\in[n]$.
 
\end{definition}
 
%Note that we have $\P^{(n)}(\start{b}) = (1-p)^{|b|}p^{n-|b|}$ by definition of our Markov Chain.
 
\begin{definition}[Vertex visiting event] \label{def:visitingResamplings}
 
    Denote by $\mathrm{Z}^{(v)}$ the event that site $v$ becomes zero at any point in time before the Markov Chain terminates. Denote the complement by $\mathrm{NZ}^{(v)}$, i.e. the event that site $v$ does \emph{not} become zero before it terminates. Furthermore define $\mathrm{NZ}^{(v,w)} := \mathrm{NZ}^{(v)} \cap \mathrm{NZ}^{(w)}$, i.e. the event that \emph{both} $v$ and $w$ do not become zero before termination.
 
\end{definition}
 
%\begin{figure}
 
%	\begin{center}
 
%    	\includegraphics{diagram_groups.pdf}
 
%    \end{center}
 
%    \caption{\label{fig:separatedgroups} Illustration of setup of Lemma \ref{lemma:eventindependence}. Here $b_1,b_2\in\{0,1\}^n$ are bitstrings such that all zeroes of $b_1$ and all zeroes of $b_2$ are separated by two indices $v,w$.}
 
%\end{figure}
 
\begin{wrapfigure}{r}{0.25\textwidth}
 
    \centering
 
    \includegraphics{diagram_groups.pdf}
 
    \caption{\label{fig:separatedgroups} Lemma \ref{lemma:eventindependence}.}
 
\end{wrapfigure}
 
The following lemma considers two vertices $v,w$ that are never ``crossed'' so that two halves of the cycle become independent.\begin{lemma}[Conditional independence] \label{lemma:eventindependence} \label{claim:eventindependence}
 
    Let $b=b_1\land b_2\in\{0,1\}^n$ be a state with two groups of zeroes that are separated by at least one site inbetween, as in Figure \ref{fig:separatedgroups}. Let $v$, $w$ be any indices inbetween the groups, such that $b_1$ lies on one side of them and $b_2$ on the other, as shown in the figure. Furthermore, let $A_1$ be any event that depends only on the sites ``on the $b_1$ side of $v,w$'', and similar for $A_2$ (for example $\mathrm{Z}^{(i)}$ for an $i$ on the correct side). Then we have
 
    \begin{align*}
 
        \P^{(n)}_b(\mathrm{NZ}^{(v,w)}, A_1, A_2)
 
        &=
 
        \P^{(n)}_{b_1}(\mathrm{NZ}^{(v,w)}, A_1)
 
        \; \cdot \;
 
        \P^{(n)}_{b_2}(\mathrm{NZ}^{(v,w)}, A_2) \\
 
        \P^{(n)}_b(A_1, A_2 \mid \mathrm{NZ}^{(v,w)})
 
        &=
 
        \P^{(n)}_{b_1}(A_1 \mid \mathrm{NZ}^{(v,w)})
 
        \; \cdot \;
 
        \P^{(n)}_{b_2}(A_2 \mid \mathrm{NZ}^{(v,w)}) .%\\
 
        %R_{b,\mathrm{NZ}^{(v,w)},A_1,A_2}
 
        %&=
 
        %R_{b_1,\mathrm{NZ}^{(v,w)},A_1}
 
        %\; + \;
 
        %R_{b_2,\mathrm{NZ}^{(v,w)},A_2}
 
    \end{align*}
 
    %up to any order in $p$.
 
\end{lemma}
 

	
 
\begin{proof}
 
    From any path $\xi\in\start{b} \cap \mathrm{NZ}^{(v,w)}$ we can construct paths $\xi_1\in\start{b_1}\cap \mathrm{NZ}^{(v,w)}$ and $\xi_2\in\start{b_2}\cap\mathrm{NZ}^{(v,w)}$ as follows. Let us write the path $\xi$ as
 
    $$\xi=\left( (\text{initialize }b), (z_1, s_1, r_1), (z_2, s_2, r_2), ..., (z_{|\xi|}, s_{|\xi|}, r_{|\xi|}) \right)$$
 
    where $z_i\in[n]$ denotes the number of zeroes in the state before the $i$th step, $s_i\in [n]$ denotes the site that was resampled and $r_i\in \{0,1\}^3$ is the result of the three resampled bits. We have
 
    \begin{align*}
 
        \P^{(n)}_b[\xi] &= \P(\text{pick }s_1 | z_1) \P(r_1) \P(\text{pick }s_2 | z_2) \P(r_2) \cdots \P(\text{pick }s_{|\xi|} | z_{|\xi|}) \P(r_{|\xi|}) \\
 
                &= \frac{1}{z_1} \P(r_1) \frac{1}{z_2} \P(r_2) \cdots \frac{1}{z_{|\xi|}} \P(r_{|\xi|}) .
 
    \end{align*}
 
    To construct $\xi_1$ and $\xi_2$, start with $\xi_1 = \left( (\text{initialize }b_1) \right)$ and $\xi_2 = \left( (\text{initialize }b_2) \right)$. For each step $(z_i,s_i,r_i)$ in $\xi$ do the following: if $s_i$ is ``on the $b_1$ side of $v,w$'' then append $(z^{(1)}_i,s_i,r_i)$ to $\xi_1$ and if its ``on the $b_2$ side of $v,w$'' then append $(z^{(2)}_i,s_i,r_i)$ to $\xi_2$. Here $z^{(1)}_i$ is the number of zeroes that were on the $b_1$ side and $z^{(2)}_i$ is the number of zeroes on the $b_2$ side so we have $z_i = z^{(1)}_i + z^{(2)}_i$.
 
    %Let the resulting paths be
 
@@ -583,97 +583,97 @@ The following lemma considers two vertices $v,w$ that are never ``crossed'' so t
 

	
 
\begin{lemma}[Conditional independence 2] \label{lemma:eventindependenceNew}
 
	Let $v,w \in [n]$, and let $A$ be any event that depends only on the sites $[v,w]$ (meaning the initialization and resamples) and similarly $B$ an event that depends only on the sites $[w,v]$. (For example $\mathrm{Z}^{(s)}$ or ``$s$ has been resampled at least $k$ times'' for an $s$ on the correct interval). Then we have
 
	\begin{align*}
 
		\P^{(n)}(\mathrm{NZ}^{(v,w)}\cap A\cap B)
 
		=
 
		\P_{b_v=b_w=1}^{[v,w]}(\mathrm{NZ}^{(v,w)}\cap A)
 
		\; \cdot \;
 
		\P^{[w,v]}(\mathrm{NZ}^{(v,w)}\cap B),
 
	\end{align*}
 
	and similarly
 
	\begin{align*}
 
		\P^{[n]}(\mathrm{NZ}^{(v)}\cap A\cap B)
 
		=
 
		\P_{b_v=1}^{[v]}(\mathrm{NZ}^{(v)}\cap A)
 
		\; \cdot \;
 
		\P^{[v,n]}(\mathrm{NZ}^{(v)}\cap B)
 
	\end{align*}
 
	where there is no longer a condition on the starting state.
 
\end{lemma}
 
\begin{proof}
 
    We start by relating the different Markov Chains.
 
    If $b$ is a starting state where all the zeroes are inside an interval $[v,w]$ (not on the boundary) then we can switch between the cycle and the finite chain:
 
    \begin{align*}
 
        \P^{(n)}_{b} (\NZ{v,w} \cap A) = \P^{[v,w]}_b (\NZ{v,w}\cap A) .
 
    \end{align*}
 
    If vertex $v$ and $w$ never become zero, then the zeroes never get outside of the interval $[v,w]$ and we can ignore the entire circle and only focus on the process within $[v,w]$.
 
    We can apply this to the result of Lemma \ref{lemma:eventindependence}, to get
 
    \begin{align*}
 
        \P^{(n)}_b(\mathrm{NZ}^{(v,w)} \cap A \cap B)
 
        &=
 
        \P^{[v,w]}_{b|_{[v,w]}}(\mathrm{NZ}^{(v,w)} \cap A)
 
        \; \cdot \;
 
        \P^{[v,w]}_{b|_{[w,v]}}(\mathrm{NZ}^{(v,w)} \cap B)
 
    \end{align*}
 
    Note that this also holds if $b$ has zeroes on the boundary (i.e. $b_v=0$ or $b_w=0$), because then both sides of the equations are zero.
 
    For the starting state we have the expression $\P^{(n)}(\start{b}) = (1-p)^{|b|} p^{n-|b|}$ so it splits into a product
 
    \begin{align*}
 
        \P^{(n)}(\start{b}) = \P^{[v,w]}(\start{b|_{[v+1,w-1]}}) \;\; \P^{[w,v]}(\start{b|_{[w,v]}})
 
    \end{align*}
 
    where we have to be careful to count the boudary only once.
 
    We now have
 
    \begin{align*}
 
		\P^{(n)}(\mathrm{NZ}^{(v,w)}\cap A\cap B)
 
        &= \sum_{b\in\{0,1\}^n} \P^{(n)}_b(\mathrm{NZ}^{(v,w)}\cap A\cap B) \; \P^{(n)}(\start{b}) \\
 
        &= \sum_{b\in\{0,1\}^n}
 
            \P^{[v,w]}_{b|_{[v,w]}}(\mathrm{NZ}^{(v,w)}\cap A)
 
            \P^{[v,w]}(\start{b|_{[v+1,w-1]}})
 
            \\ &\qquad\qquad\quad
 
            \\ &\qquad\qquad\quad\cdot
 
            \P^{[w,v]}_{b|_{[w,v]}}(\mathrm{NZ}^{(v,w)}\cap B)
 
            \P^{[w,v]}(\start{b|_{[w,v]}}) \\
 
        &= \left( \sum_{\substack{b_1\in\{0,1\}^{[v,w]}\\ b_v=b_w=1}}
 
            \P^{[v,w]}_{b_1}(\mathrm{NZ}^{(v,w)}\cap A)
 
            \P^{[v,w]}(\start{b_1}) \right)
 
            \\ &\qquad \cdot
 
           \left( \sum_{b_2\in\{0,1\}^{[w,v]}}
 
            \P^{[w,v]}_{b_2}(\mathrm{NZ}^{(v,w)}\cap B)
 
            \P^{[w,v]}(\start{b_2}) \right) \\
 
        &=  \P^{[v,w]}_{b_v=b_w=1}(\mathrm{NZ}^{(v,w)}\cap A) \cdot
 
            \P^{[w,v]}(\mathrm{NZ}^{(v,w)}\cap B)
 
    \end{align*}
 
    The second equality follows in a similar way.
 
\end{proof}
 

	
 
    Some notation: let $P$ be an interval $[a,b]$. We say $P$ is a \emph{patch} when the $\Z{i}$ event holds for all $i \in [a,b]$ and $\NZ{a-1}$ and $\NZ{b+1}$ holds. We denote this event by $P\in\mathcal{P}$, so
 
	\begin{align*}
 
	P\in\mathcal{P} \equiv \NZ{a-1} \cap \Z{a} \cap \Z{a+1} \cap \cdots \cap \Z{b-1} \cap \Z{b} \cap \NZ{b+1} .
 
	\end{align*}
 
	Note that we have the following partition of the event $\Z{v}$ for any vertex $v\in[n]$:
 
	\begin{align*}
 
	\Z{v} = \dot\bigcup_{P : v\in P} (P\in\mathcal{P})
 
	\end{align*}
 

	
 
The intuition of the following lemma is that the far right can only affect the zero vertex if there is an interaction chain forming, which means that every vertex should get resampled to $0$ at least once.
 
\begin{lemma}\label{lemma:probIndepNew}
 
	$\forall n\in \mathbb{N}_+:\P^{[n]}(\Z{1})-\P^{[n+1]}(\Z{1}) = \bigO{p^{n}}$. (Should be true with $\bigO{p^{n+1}}$ as well.)
 
\end{lemma}
 
\begin{proof}
 
	The proof uses induction on $n$. For $n=1$ the statement is easy, since $\P^{[1]}(\Z{1})=p$ and $\P^{[2]}(\Z{1})=p+p^2+\bigO{p^{3}}$.
 
	
 
	Induction step: suppose we proved the claim for $n-1$, then
 
	\begin{align*}
 
	\P^{[n+1]}(\Z{1})
 
	&=\sum_{k=1}^{n+1}\P^{[n+1]}([k]\in\mathcal{P}) \tag{the events are a partition}\\
 
	&=\sum_{k=1}^{n-1}\P^{[n+1]}([k]\in\mathcal{P}) + \bigO{p^{n}}\tag*{$\left(\P^{[n+1]}([k]\in\mathcal{P})=O(p^{k})\right)$}\\	
 
	&=\sum_{k=1}^{n-1}\P^{[k+1]}_{b_{k+1}=1}([k]\in\mathcal{P})\cdot \P^{[n-k+1]}(\NZ{1})+ \bigO{p^{n}} \tag{by Claim~\ref{lemma:eventindependenceNew}}\\
 
	&=\sum_{k=1}^{n-1}\P^{[k+1]}_{b_{k+1}=1}([k]\in\mathcal{P})\cdot \left(\P^{[n-k]}(\NZ{1})+\bigO{p^{n-k}}\right)+ \bigO{p^{n}} \tag{by induction} \\	
 
	&=\sum_{k=1}^{n-1}\P^{[k+1]}_{b_{k+1}=1}([k]\in\mathcal{P})\cdot \P^{[n-k]}(\NZ{1})+ \bigO{p^{n}} \tag*{$\left(\P^{[k+1]}_{b_{k+1}=1}([k]\in\mathcal{P})=\bigO{p^{k}}\right)$}\\	
 
	&=\sum_{k=1}^{n-1}\P^{[n]}([k]\in\mathcal{P})+ \bigO{p^{n}} \tag{by Claim~\ref{lemma:eventindependenceNew}}\\
 
	&=\sum_{k=1}^{n}\P^{[n]}([k]\in\mathcal{P})+ \bigO{p^{n}} \tag*{$\left(\P^{[n]}([n]\in\mathcal{P})=\bigO{p^{n}}\right)$}\\	
 
	&=\P^{[n]}(\Z{1})	+ \bigO{p^{n}} 
 
	\end{align*}
 
\end{proof}
 
\begin{corollary}\label{cor:probIndepNew}
 
	$\P^{[n]}(\Z{1})-\P^{[m]}(\Z{1}) = \bigO{p^{\min(n,m)}}$. (Should be true with $\bigO{p^{\min(n,m)+1}}$ too.)
 
\end{corollary}
 

	
0 comments (0 inline, 0 general)