AENC/resampling_chain Changeset - 9f86b29b20b0 · Centrum Wiskunde & Informatica (CWI)

Changeset - 9f86b29b20b0

Parent rev.

Child rev.

[Not reviewed]

0 3 0

Tom Bannink - 8 years ago 2017-05-24 16:42:56
tom.bannink@cwi.nl

Update weak claim proof and path diagram

3 files changed with 38 insertions and 20 deletions:

diagram_paths.pdf

bin+mod

diagram_paths.tex

main.tex

0 comments (0 inline, 0 general)

diagram_paths.pdf

➞

Show inline comments

binary diff not shown

diagram_paths.tex

➞

Show inline comments

@@ @@ -5,55 +5,60 @@ @@
 \usepackage{parskip}
 \usepackage{marvosym} %Lightning symbol
 \usepackage[usenames,dvipsnames]{color}
 \usepackage[hidelinks]{hyperref}
 \renewcommand*{\familydefault}{\sfdefault}
 \usepackage{bbm} %For \mathbbm{1}
 %\usepackage{bbold}
 \usepackage{tikz}
 \begin{document}
 \begin{tikzpicture}
     \draw[step=1cm,gray,dotted] (-0.9,-0.9) grid (8.9,6.9);
     \foreach \x in {0,...,7} {
         \foreach \y in {0,...,5} {
             \draw[->] (\x,\y) -- (\x+0.9,\y);
             \draw[->] (\x,\y) -- (\x,\y+0.9);
+        }
         \draw [->] (\x,6) -- (\x+0.9,6);
+    }
     \foreach \y in {0,...,5}
         \draw [->] (8,\y) -- (8,\y+0.9);
     \draw (8,-0.2) node {$n_1$};
     \draw (-0.2,6) node {$n_2$};
     \draw (4,-0.5) node {step of path 1};
     \node[rotate=90,anchor=south,xshift=3cm,yshift=0.5cm] {step of path 2};
     \draw(-0.1,-0.4) node {$b_1\land b_2$};
     \draw(8,-0.4) node {$\mathbf{1} \land b_2$};
     \draw (-0.2,6.3) node {$b_1\land\mathbf{1}$};
     \draw (8.2,6.3) node {$\mathbf{1}$};
     \draw (4,-0.5) node {$\to$ steps of $\xi_1$};
     \node[rotate=90,anchor=south,xshift=3cm,yshift=0.5cm] {$\to$ steps of $\xi_2$};
     \draw[fill,red] (0,0) circle (0.08);
     \draw[fill,red] (8,0) circle (0.05);
     \draw[fill,red] (0,6) circle (0.05);
     \draw[fill,red] (8,6) circle (0.08);
     \def\x{5};
     \def\y{3};
     \draw[fill,black] (\x,\y) circle (0.07);
     \draw[fill=white,draw=black] (\x+0.25,\y-0.26) rectangle +(0.5,0.5);
     \draw[fill=white,draw=black] (\x-0.50,\y+0.26) rectangle +(1.0,0.5);
     \draw (\x+0.5,\y) node {$p_j$};
     \draw (\x,\y+0.5) node {$1-p_j$};
     \def\x{2};
     \def\y{2};
     \draw[fill,black] (\x,\y) circle (0.07);
     \draw[fill=white,draw=black] (\x+0.25,\y-0.26) rectangle +(0.5,0.5);
     \draw[fill=white,draw=black] (\x-0.50,\y+0.26) rectangle +(1.0,0.5);
     \draw (\x+0.5,\y) node {$p_i$};
     \draw (\x,\y+0.5) node {$1-p_i$};
     \def\x{8};
     \def\y{1};
     \draw[fill,black] (\x,\y) circle (0.07);
     \draw[fill=white,draw=black] (\x-0.25,\y+0.26) rectangle +(0.5,0.5);
     \draw (\x,\y+0.5) node {$1$};

main.tex

➞

Show inline comments

@@ @@ -36,48 +36,49 @@ @@
 %\usepackage{MnSymbol}
 % --- Notation shortcuts -------------------------------------------------
 % \cupdot: a \cup with a dot set above it (presumably "disjoint union" -- confirm).
 \newcommand{\cupdot}{\overset{.}{\cup}}
 % \pvp: \vec{p} followed by a small kern and a prime, i.e. "p-vector prime".
 \newcommand{\pvp}{\vec{p}{\kern 0.45mm}'}
 % Dirac notation via paired delimiters: \bra{x} -> <x|, \ket{x} -> |x>,
 % \braket{x}{y} -> <x|y> with the middle bar scaled by \delimsize.
 % NOTE(review): \DeclarePairedDelimiter(X) is expected to come from mathtools,
 % which must be loaded outside this hunk -- confirm.
 \DeclarePairedDelimiter\bra{\langle}{\rvert}
 \DeclarePairedDelimiter\ket{\lvert}{\rangle}
 \DeclarePairedDelimiterX\braket[2]{\langle}{\rangle}{#1 \delimsize\vert #2}
 % \underflow{a}{b}: sets an \overbrace over #1 underneath #2; the -60mm kerns on
 % both sides shrink the width the underset material reports to \underset.
 \newcommand{\underflow}[2]{\underset{\kern-60mm \overbrace{#1} \kern-60mm}{#2}}
 % \Ind(x): delimited-argument macro (called with parentheses, not braces) that
 % typesets "Ind(x)" in typewriter type.
 \def\Ind(#1){{{\tt Ind}({#1})}}
 % Upright operator names. These use \def, which overwrites any existing
 % definition without warning (LaTeX already provides \Pr).
 \def\Id{\mathrm{Id}}
 \def\Pr{\mathrm{Pr}}
 \def\Tr{\mathrm{Tr}}
 \def\im{\mathrm{im}}
 % \bOt{f}: \widetilde{\mathcal O}(f) with auto-sized parentheses.
 \newcommand{\bOt}[1]{\widetilde{\mathcal O}\left(#1\right)}
 % Complexity class names, set in sans serif.
 \newcommand{\QMAo}{\textsf{QMA$_1$}}
 \newcommand{\BQP}{\textsf{BQP}}
 \newcommand{\NP}{\textsf{NP}}
 % NOTE(review): the space after \# is typeset, giving "# P" -- confirm this is intended.
 \newcommand{\SharpP}{\textsf{\# P}}
 % \diam{C}: \mathcal{D}(C); the body text uses it for the diameter of a configuration C.
 \newcommand{\diam}[1]{\mathcal{D}\left(#1\right)}
 % \paths{b}: \mathcal{P}(b \to \mathbf{1}); the body text sums over it as the set of
 % paths of the chain from state b to \mathbf{1}.
 \newcommand{\paths}[1]{\mathcal{P}\left(#1\to\mathbf{1}\right)}
 % \gapsum{x}: upright "gapsum" followed by its argument in auto-sized parentheses.
 \newcommand{\gapsum}[1]{\mathrm{gapsum}\left(#1\right)}
 % \ignore{...}: discards its argument; \long allows paragraph breaks inside it.
 \long\def\ignore#1{}
 % --- Theorem-like environments -------------------------------------------
 % All environments below share the counter of `theorem`.
 \newtheorem{theorem}{Theorem}
 \newtheorem{corollary}[theorem]{Corollary}%[theorem]
 \newtheorem{lemma}[theorem]{Lemma}
 \newtheorem{prop}[theorem]{Proposition}
 \newtheorem{definition}[theorem]{Definition}
 \newtheorem{claim}[theorem]{Claim}
 \newtheorem{remark}[theorem]{Remark}
 % Hand-rolled proof environment: unindented bold "Proof. " at the start, and a
 % right-flushed box followed by a line break and \smallskip at the end.
 % NOTE(review): \newenvironment errors if `proof` already exists (amsthm defines
 % one) -- confirm amsthm is not loaded.
 \newenvironment{proof}
 {\noindent {\bf Proof. }}
 {{\hfill $\Box$}\\	\smallskip}
 \usepackage[final]{hyperref}
 \hypersetup{
 	colorlinks = true,
 	allcolors = {blue},
+}
 \usepackage{ifpdf}
 \ifpdf
 	\typeout{^^J *** PDF mode *** }
 %	\input{myBiblatex.tex}
@@ @@ -126,63 +127,65 @@ @@
 	We want to calculate the average number of resamplings $R^{(n)}$, which we define as the expected number of resamplings divided by $n$. For this let $\rho,\mathbbm{1}\in[0,1]^{2^n}$ be indexed with elements of $\{0,1\}^n$ such that $\rho_b=p(b)$ and $\mathbbm{1}_b=1$. Then we use that the expected number of resamplings is just the hitting time of the Markov chain:
 	\begin{align*}
 		R^{(n)}:&=\mathbb{E}(\#\{\text{resampling before termination}\})/n\\
 		&=\sum_{k=1}^{\infty}P(\text{at least } k \text{ resamplings are performed})/n\\
 		&=\sum_{k=1}^{\infty}\rho M_{(n)}^k \mathbbm{1}/n\\
 		&=\sum_{k=0}^{\infty}a^{(n)}_k p^k
 	\end{align*}
 	\begin{table}[]
 	\centering
 	\caption{Table of the coefficients $a^{(n)}_k$}
 	\label{tab:coeffs}
 	\resizebox{\columnwidth}{!}{%
 		\begin{tabular}{c|ccccccccccccccccccccc}
 			\backslashbox[10mm]{$n$}{$k$} & 0 & 1 & 2 & 3 & 4 & 5 & 6 & 7 & 8 & 9 & 10 & 11 & 12 & 13 & 14 & 15 & 16 & 17 & 18 & 19 & 20 \\		\hline
 &	0 & 1 & \cellcolor{blue!25}2 & 3+1/3 & 5.00 & 7.00 & 9.33 & 12.00 & 15.00 & 18.33 & 22.00 & 26.00 & 30.33 & 35.00 & 40.00 & 45.333 & 51.000 & 57.000 & 63.333 & 70.000 & 77.000 \\
 &	0 & 1 & 2 & \cellcolor{blue!25}3+2/3 & 6.16 & 9.66 & 14.3 & 20.33 & 27.83 & 37.00 & 48.00 & 61.00 & 76.16 & 93.66 & 113.6 & 136.33 & 161.83 & 190.33 & 222.00 & 257.00 & 295.50 \\
 &	0 & 1 & 2 & 3+2/3 & \cellcolor{blue!25}6.44 & 10.8 & 17.3 & 26.65 & 39.43 & 56.48 & 78.65 & 106.9 & 142.2 & 185.8 & 238.7 & 302.41 & 378.05 & 467.13 & 571.14 & 691.69 & 830.44 \\
 &	0 & 1 & 2 & 3+2/3 & 6.44 & \cellcolor{blue!25}11.0 & 18.5 & 30.02 & 47.10 & 71.68 & 106.0 & 152.9 & 215.4 & 297.4 & 403.1 & 537.21 & 705.25 & 913.31 & 1168.2 & 1477.4 & 1849.1 \\
 &	0 & 1 & 2 & 3+2/3 & 6.44 & 11.0 & \cellcolor{blue!25}18.7 & 31.21 & 50.83 & 80.80 & 125.3 & 189.7 & 280.8 & 407.0 & 578.6 & 808.13 & 1110.2 & 1502.6 & 2005.6 & 2643.2 & 3443.1 \\
 &	0 & 1 & 2 & 3+2/3 & 6.44 & 11.0 & 18.7 & \cellcolor{blue!25}31.44 & 52.08 & 84.95 & 136.0 & 213.6 & 328.9 & 496.5 & 735.6 & 1070.7 & 1532.5 & 2159.5 & 2998.8 & 4108.1 & 5556.7 \\
 &	0 & 1 & 2 & 3+2/3 & 6.44 & 11.0 & 18.7 & 31.44 & \cellcolor{blue!25}52.30 & 86.27 & 140.7 & 226.3 & 358.4 & 558.4 & 855.4 & 1289.0 & 1911.5 & 2791.4 & 4017.2 & 5701.4 & 7985.9 \\
 &	0 & 1 & 2 & 3+2/3 & 6.44 & 11.0 & 18.7 & 31.44 & 52.30 & \cellcolor{blue!25}86.49 & 142.1 & 231.6 & 373.4 & 594.8 & 934.4 & 1447.1 & 2209.0 & 3324.6 & 4934.8 & 7226.9 & 10447. \\
 		\end{tabular}
             \vdots \\
 & 0 & 1 & 2 & 3+2/3 & 6.44 & 11.08 & 18.76 & 31.45 & 52.31 & 86.49 & 142.33 & 233.31 & 381.17 & 621.02 & 1009.38 & \cellcolor{blue!25}1637.13 & % 2650.74 & 4285.68 & 6913.55 & 11171.2 & 18052.2
         \end{tabular}
+	}
 	\end{table}
 	We observe that this is a power series in $p$. We discovered a very regular structure in this power series. It seems that for all $k\in\mathbb{N}$ and for all $n>k$ we have that $a^{(n)}_k$ is constant; we verified this conjecture using a computer up to $n=14$.
 	\newpage
 	\noindent Based on our calculations presented in Table~\ref{tab:coeffs} and Figure~\ref{fig:coeffs_conv_radius} we make the following conjectures:
 	\begin{enumerate}[label=(\roman*)]
 		\item $\forall k\in\mathbb{N}, \forall n\geq 3 : a^{(n)}_k\geq 0$	\label{it:pos}
         (A simpler version: $\forall k>0: a_k^{(3)}=(k+1)(k+2)/6$)
 		\item $\forall k\in\mathbb{N}, \forall n>m\geq 3 : a^{(n)}_k\geq a^{(m)}_k$ \label{it:geq}
 		\item $\forall k\in\mathbb{N}, \forall n,m\geq \max(k,3) : a^{(n)}_k=a^{(m)}_k$ \label{it:const}
   		\item $\exists p_c=\lim\limits_{k\rightarrow\infty}1\left/\sqrt[k]{a_{k}^{(k+1)}}\right.$ \label{it:lim}
 	\end{enumerate}
-	We also conjecture that $p_c\approx0.62$, see Figure~\ref{fig:coeffs_conv_radius}.
+	We also conjecture that $p_c\approx0.61$, see Figure~\ref{fig:coeffs_conv_radius}.
 	\begin{figure}[!htb]\centering
 	\includegraphics[width=0.5\textwidth]{coeffs_conv_radius.pdf}
 	%\includegraphics[width=0.5\textwidth]{log_coeffs.pdf}
 	\caption{$1\left/\sqrt[k]{a_{k}^{(k+1)}}\right.$} %$\frac{1}{\sqrt[k]{a_k^{(k+1)}}}$
 	\label{fig:coeffs_conv_radius}
 	\end{figure}
     For reference, we also explicitly give formulas for $R^{(n)}(p)$ for small $n$. We also give them in terms of $q=1-p$ because they sometimes look nicer that way.
     \begin{align*}
     	R^{(3)}(p) &= \frac{1-(1-p)^3}{3(1-p)^3}
         			= \frac{1-q^3}{3q^3}\\
     	R^{(4)}(p) &= \frac{p(6-12p+10p^2-3p^3)}{6(1-p)^4}
                     = \frac{(1-q)(1+q+q^2+3q^3)}{6q^4}\\
         R^{(5)}(p) &= \frac{p(90-300p+435p^2-325p^3+136p^4-36p^5+6p^6)}{15(1-p)^5(6-2p+p^2)}\\
                    &= \frac{(1-q)(6+5q+6q^2+21q^3+46q^4+6q^6)}{15q^5(5+q^2)}
     \end{align*}
 	If statements \ref{it:pos}-\ref{it:lim} are true, then we can define the function
 	$$R^{(\infty)}(p):=\sum_{k=0}^{\infty}a^{(k+1)}_k p^k,$$
 	which would then have radius of convergence $p_c$. It would also satisfy, for all $p\in[0,p_c)$, that $R^{(n)}(p)\leq R^{(\infty)}(p)$ and $\lim\limits_{n\rightarrow\infty}R^{(n)}(p)=R^{(\infty)}(p)$.
 	It would also imply that for all $p\in(p_c,1]$ we get $R^{(n)}(p)=\Omega\left(\left(\frac{p}{p_c}\right)^{n/2}\right)$.
 	This would then imply a very strong critical behaviour. It would mean that for all $p\in[0,p_c)$ the expected number of resamplings is bounded by a constant $R^{(\infty)}(p)$ times $n$, whereas for all $p\in(p_c,1]$ the expected number of resamplings is exponentially growing in $n$.
 	\begin{center}
     	\includegraphics{diagram_gap.pdf}
     \end{center}
     \caption{\label{fig:diametergap} A configuration $C=\{1,2,4,7,9\}\subseteq[n]$ consisting of 5 slots shown by the red dots. The dotted line at the top depicts the rest of the circle which may be much larger. The diameter of this configuration is $\diam{C}=9$ as shown and the largest gap of $C$ is $\mathrm{gap}(C)=2$. Note that we do not count the rest of the circle as a gap, we only consider gaps within the diameter of $C$.}
 \end{figure}
 \begin{claim}[Strong cancellation claim] \label{claim:strongcancel}
 	The lowest order term in
     \begin{align*}
         \sum_{f\in\{0,1'\}^{|C|}} \rho_{C(f)} R_{C(f)} ,
     \end{align*}
 	is $p^{\diam{C}}$ when $n$ is large enough. All lower order terms cancel out.
 \end{claim}
 Example: for $C_0=\{1,2,4,7,9\}$ (the configuration shown in Figure \ref{fig:diametergap}) we computed the quantity up to order $p^{20}$ in an infinite system:
 \begin{align*}
 	\sum_{f\in\{0,1'\}^{|C_0|}} \rho_{C_0(f)} R_{C_0(f)} &= 0.0240278 p^{9} + 0.235129 p^{10} + 1.24067 p^{11} + 4.71825 p^{12} \\
     &\quad + 14.5555 p^{13} + 38.8307 p^{14} + 93.2179 p^{15} + 206.837 p^{16}\\
     &\quad + 432.302 p^{17} + 862.926 p^{18} + 1662.05 p^{19} + 3112.9 p^{20} + \mathcal{O}(p^{21})
 \end{align*}
 and indeed the lowest order is $\diam{C_0}=9$.
+~
 A weaker version of the claim is that if $C$ contains a gap of size $k$, then the sum is zero up to and including order $p^{k-1}$.
+A weaker version of the claim is that if $C$ contains a gap of size $k$, then the sum is zero up to and including order $p^{|C|+k-1}$.
 \begin{claim}[Weak cancellation claim] \label{claim:weakcancel}
 	For $C\subseteq[n]$ a configuration of slot positions, the lowest order term in
     \begin{align*}
         \sum_{f\in\{0,1'\}^{|C|}} \rho_{C(f)} R_{C(f)} ,
     \end{align*}
 	is at least $p^{\mathrm{gap}(C)}$ when $n$ is large enough. Here $\mathrm{gap}(C)$ is defined as in Figure \ref{fig:diametergap}; it is the size of the largest gap of $C$ within the diameter of $C$. All lower order terms cancel out.
+	is at least $p^{|C|+\mathrm{gap}(C)}$ when $n$ is large enough. Here $\mathrm{gap}(C)$ is defined as in Figure \ref{fig:diametergap}; it is the size of the largest gap of $C$ within the diameter of $C$. All lower order terms cancel out.
 \end{claim}
 This weaker version would imply \ref{it:const} but for $\mathcal{O}(k^2)$ as opposed to $k+1$.
 \newpage
 The reason that claim \ref{claim:strongcancel} would prove \ref{it:const} is the following:
 For a starting configuration that \emph{does} give a nonzero contribution, you can take that same starting configuration and translate it to get $n$ other configurations that give the same contribution. Therefore the coefficient in the expected number of resamplings is a multiple of $n$ which Andr\'as already divided out in the definition of $R^{(n)}(p)$. To show \ref{it:const} we argue that this is the \emph{only} dependency on $n$. This is because there are only finitely many (depending on $k$ but not on $n$) configurations where the $k$ slots are nearby regardless of the value of $n$. So there are only finitely many nonzero contributions after translation symmetry was taken out. For example, when considering all starting configurations with 5 slots one might think there are $\binom{n}{5}$ configurations to consider which would be a dependency on $n$ (more than only the translation symmetry). But since most of these configurations have a diameter larger than $k$, they do not contribute to $a_k$. Only finitely many do and that does not depend on $n$.
+~
 Section \ref{sec:computerb} shows how to compute $R_b$ (this is not relevant for showing the claim) and the section after that shows how to prove the weaker claim.
 \newpage
 \subsection{Computation of $R_b$} \label{sec:computerb}
 By $R_{101}$ we denote $R_b(p)$ for a $b$ that consists of only $1$s except for a single zero. We compute $R_{101}$ up to second order in $p$. This requires the following transitions.
 \begin{align*}
     \framebox{$1 0 1$} &\to \framebox{$1 1 1$} & (1-p)^3 = 1-3p+3p^2-p^3\\
     \hline
     \framebox{$1 0 1$} &\to
         \begin{cases}
             \framebox{$0 1 1$}\\
             \framebox{$1 0 1$}\\
             \framebox{$1 1 0$}
         \end{cases}
     R_{101} &= (1-3p+3p^2 - p^3)(1) + (3p -6p^2 +3p^3) (1+R_{101}) \\
             &\quad + (p^2 - p^3) (1+R_{10101}) + (2p^2-2p^3) (1+R_{1001}) \\
 			&= 1 + 3 p + 7 p^2 + 14.6667 p^3 + 29 p^4 + 55.2222 p^5 + 102.444 p^6 + 186.36 p^7 \\
             &\quad + 333.906 p^8 + 590.997 p^9 + 1035.58 p^{10} + 1799.39 p^{11} + 3104.2 p^{12} \\
             &\quad+ 5322.18 p^{13} + 9075.83 p^{14} + 15403.6 p^{15} + 26033.4 p^{16} + 43833.5 p^{17} \\
             &\quad+ 73555.2 p^{18} + 123053 p^{19} + 205290 p^{20} + 341620 p^{21} + 567161 p^{22} \\
             &\quad+ 939693 p^{23} + 1.5537\cdot10^{6} p^{24} + 2.56158\cdot10^{6} p^{25} + \mathcal{O}(p^{26})
 \end{align*}
 where the recursion steps were done with a computer. This assumes $n$ to be much larger than the largest power of $p$ considered.
 Note: in the first line at the second term it uses that with probability $(3p-6p^2)$ the state goes to $\framebox{$101$}$ and then the expected number of resamplings is $1+R_{101}$. I (Tom) believe this requires the assumption $p_\mathrm{tot} := \sum_{\xi\in\paths{b}} \mathbb{P}[\xi] = 1$. To see why this is required, note that the actual term in the recursive formula should be $$(3p-6p^2)\cdot\left( \sum_{\xi\in\paths{101}} \mathbb{P}[\xi] \cdot \left( 1 + |\xi|\right) \right) = (3p-6p^2)\left( p_\mathrm{tot} + R_{101} \right)$$
 If there were a non-zero probability of never stopping the resampling process, then $p_\mathrm{tot}$ (the probability of ever reaching $\mathbf{1}$) could be less than one. Therefore I assume that $R^{(n)}(p)$ is finite, which implies that the probability of ever reaching $\mathbf{1}$ is 1.
 \newpage
 \subsection{Cancellation of gapped configurations}
 Here we prove claim \ref{claim:weakcancel}, the weaker version of the claim. We require the following definition
 \begin{definition}[Path independence] \label{def:independence}
 	We say two paths $\xi_i\in\paths{b_i}$ ($i=1,2$) of the Markov Chain are \emph{independent} if $\xi_1$ never resamples a site that was ever zero in $\xi_2$ and the other way around. It is allowed that $\xi_1$ resamples a $1$ to a $1$ that was also resampled from $1$ to $1$ by $\xi_2$ and vice versa. If the paths are not independent then we call the paths \emph{dependent}.
 \end{definition}
 The key ingredient of the proof is the following claim:
 \begin{claim}[Sum of expectation values] \label{claim:expectationsum}
 When $b=b_1\land b_2\in\{0,1\}^n$ is a state with two groups ($b_1\lor b_2 = 1^n$) of zeroes with $k$ $1$s in between the groups, then we have $R_b(p) = R_{b_1}(p) + R_{b_2}(p) + \mathcal{O}(p^{k})$ where $b_1$ and $b_2$ are the configurations where only one of the groups is present and the other group has been replaced by $1$s. To be precise, the sums agree up to and including order $p^{k-1}$.
 \end{claim}
 For example for $b_1 = 10111111$ and $b_2 = 11111000$ we have $b=10111000$ and $k=3$. The claim says that the expected time to reach $\mathbf{1}$ from $b$ is the time to make the first group $1$ plus the time to make the second group $1$, as if they are independent. When going up to order $p^{k}$ or higher, there will be terms where the groups interfere so they are no longer independent.
 \textbf{Example}: For $b_1 = 0111111$ and $b_2 = 1111010$ we have $b=0111010$ and $k=3$. The claim says that the expected time to reach $\mathbf{1}$ from $b$ is the time to make the first group $1$ plus the time to make the second group $1$, as if they are independent. Simulation shows that
 \begin{align*}
     R_{b_1} &= 1 + 3p + 7p^2 + 14.67p^3 + 29p^4 + \mathcal{O}(p^5)\\
     R_{b_2} &= 2 + 5p + 10.67p^2 + 21.11p^3+40.26p^4 + \mathcal{O}(p^5)\\
     R_{b} &= 3 + 8p + 17.67p^2 + 34.78p^3+65.27p^4 + \mathcal{O}(p^5)\\
     R_{b_1} + R_{b_2} &= 3 + 8p + 17.67p^2+35.78p^3 + 69.26p^4 +\mathcal{O}(p^5)
 \end{align*}
 and indeed the sums agree up to order $p^{k-1}=p^2$. When going up to order $p^{k}$ or higher, there will be terms where the groups interfere so they are no longer independent.
+~
 \begin{proof}
 Consider a path $\xi_1\in\paths{b_1}$ and a path $\xi_2\in\paths{b_2}$ such that $\xi_1$ and $\xi_2$ are independent (Definition \ref{def:independence}). The paths $\xi_1,\xi_2$ induce $\binom{|\xi_1|+|\xi_2|}{|\xi_1|}$ different paths of total length $|\xi_1|+|\xi_2|$ in $\paths{b_1\land b_2}$. In the sums $R_{b_1}$ and $R_{b_2}$, the contributions of these paths are $\mathbb{P}[\xi_1]\cdot |\xi_1|$ and $\mathbb{P}[\xi_2]\cdot |\xi_2|$. The next diagram shows how these $\binom{|\xi_1|+|\xi_2|}{|\xi_1|}$ paths contribute to $R_{b_1\land b_2}$. At every step one has to choose between doing a step of path 1 or a step of path 2. The number of zeroes in the current state determines the probabilities with which this happens (aside from the probabilities associated to the two original paths already). The grid below shows that at every point one can choose to do a step of path 1 with probability $p_i$ or a step of path 2 with probability $1-p_i$. These $p_i$ could in principle be different at every point in this grid. The weight of such a new path is the weight of the path in the diagram below, multiplied by $\mathbb{P}[\xi_1]\cdot\mathbb{P}[\xi_2]$. By induction one can show that the sum over all $\binom{|\xi_1|+|\xi_2|}{|\xi_1|}$ paths in the grid is $1$. Hence the contribution of all $\binom{|\xi_1|+|\xi_2|}{|\xi_1|}$ paths together to $R_{b_1\land b_2}$ is given by
 Consider a path $\xi_1\in\paths{b_1}$ and a path $\xi_2\in\paths{b_2}$ such that $\xi_1$ and $\xi_2$ are independent (Definition \ref{def:independence}). The paths $\xi_1,\xi_2$ induce $\binom{|\xi_1|+|\xi_2|}{|\xi_1|}$ different paths of total length $|\xi_1|+|\xi_2|$ in $\paths{b_1\land b_2}$. In the sums $R_{b_1}$ and $R_{b_2}$, the contributions of these paths are $\mathbb{P}[\xi_1]\cdot |\xi_1|$ and $\mathbb{P}[\xi_2]\cdot |\xi_2|$. The next diagram shows how these $\binom{|\xi_1|+|\xi_2|}{|\xi_1|}$ paths contribute to $R_{b_1\land b_2}$. At every step one has to choose between doing a step of $\xi_1$ or a step of $\xi_2$. The number of zeroes in the current state determines the probabilities with which this happens (besides the probabilities associated to the two original paths already). The grid below shows that at every point one can choose to do a step of $\xi_1$ with probability $p_i$ or a step of $\xi_2$ with probability $1-p_i$. These $p_i$ could in principle be different at every point in this grid.
 \begin{center}
 \includegraphics{diagram_paths.pdf}
 \end{center}
 The weight of such a new path is the weight of the path in the diagram, multiplied by $\mathbb{P}[\xi_1]\cdot\mathbb{P}[\xi_2]$. By induction one can show that the sum over all $\binom{|\xi_1|+|\xi_2|}{|\xi_1|}$ paths in the grid is $1$. Hence the contribution of all $\binom{|\xi_1|+|\xi_2|}{|\xi_1|}$ paths together to $R_{b_1\land b_2}$ is given by
 \[
 \mathbb{P}[\xi_1]\cdot\mathbb{P}[\xi_2]\cdot(|\xi_1|+|\xi_2|) = \mathbb{P}[\xi_2]\cdot\mathbb{P}[\xi_1]\cdot|\xi_1| \;\; + \;\; \mathbb{P}[\xi_1]\cdot\mathbb{P}[\xi_2]\cdot|\xi_2|.
 \]
 Ideally we would now like to sum this expression over all possible paths $\xi_1,\xi_2$ and use $p_\mathrm{tot}:=\sum_{\xi\in\paths{b_i}} \mathbb{P}[\xi] = 1$ (which also holds up to arbitrary order in $p$). The above expression would then become $R_{b_1} + R_{b_2}$. However, not all paths in the sum would satisfy the independence condition so it seems we can't do this. We now argue that it works up to order $p^{k-1}$.
 For all $\xi\in\paths{b_1\land b_2}$ we have that \emph{either} $\xi$ splits into two independent paths $\xi_1,\xi_2$ as above, \emph{or} it does not. In the latter case, when $\xi$ cannot be split like that, we know $\mathbb{P}[\xi]$ contains a power $p^k$ or higher because there is a gap of size $k$ and the paths must have moved at least $k$ times `towards each other' (for example one path moves $m$ times to the right and the other path moves $k-m$ times to the left). So the total weight of such a combined path is at least order $p^k$. Therefore we have
 \[
 	R_{b_1\land b_2} = \sum_{\mathclap{\substack{\xi_{1,2}\in\paths{b_{1,2}}\\ \mathrm{independent}}}} \mathbb{P}[\xi_2]\mathbb{P}[\xi_1]|\xi_1| + \sum_{\mathclap{\substack{\xi_{1,2}\in\paths{b_{1,2}}\\ \mathrm{independent}}}} \mathbb{P}[\xi_1]\mathbb{P}[\xi_2]|\xi_2| + \sum_{\mathclap{\xi\;\mathrm{dependent}}} \mathbb{P}[\xi]|\xi|.
 \]
 where the last sum contains only terms of order $p^{k}$ or higher. Now for the first sum, note that
 \[
 	\sum_{\mathclap{\substack{\xi_{1,2}\in\paths{b_{1,2}}\\ \mathrm{independent}}}} \mathbb{P}[\xi_2]\mathbb{P}[\xi_1]|\xi_1|
     = \sum_{\xi_1\in\paths{b_1}} \sum_{\substack{\xi_2\in\paths{b_2}\\ \text{independent of }\xi_1}} \mathbb{P}[\xi_2]\mathbb{P}[\xi_1]|\xi_1|
 \]
 where the sum over independent paths could be empty for certain $\xi_1$. Now we replace this last sum by a sum over \emph{all} paths $\xi_2\in\paths{b_2}$. This will change the sum but only for terms where $\xi_1,\xi_2$ are dependent. For those terms we already know that $\mathbb{P}[\xi_1]\mathbb{P}[\xi_2]$ contains a factor $p^k$ and hence we have
 \begin{align*}
     \sum_{\mathclap{\substack{\xi_{1,2}\in\paths{b_{1,2}}\\ \mathrm{independent}}}} \mathbb{P}[\xi_2]\mathbb{P}[\xi_1]|\xi_1|
     &= \sum_{\xi_1\in\paths{b_1}} \sum_{\xi_2\in\paths{b_2}} \mathbb{P}[\xi_2]\mathbb{P}[\xi_1]|\xi_1| + \mathcal{O}(p^k) \\
     &= \sum_{\xi_1\in\paths{b_1}} \mathbb{P}[\xi_1]|\xi_1| + \mathcal{O}(p^k) \\
     &= R_{b_1} + \mathcal{O}(p^k)
 \end{align*}
 We can do the same with the second sum, and this proves the claim.
 \end{proof}
 \begin{center}
 \includegraphics{diagram_paths.pdf}
 \end{center}
 \textbf{Proof of claim \ref{claim:weakcancel}}: Say we have a group on the left with $l$ slots and a group on the right with $r$ slots, with enough space between the groups. Then on the left we have strings in $\{0,1'\}^l$ as possibilities and on the right we have strings in $\{0,1'\}^r$. The combined configuration can be described by strings $(a,b)\in\{0,1'\}^{l+r}$. Such a configuration has probability $(-1)^{|a|+|b|} p^{r+l}$ in $\rho$ and by claim \ref{claim:expectationsum} we know $R_{(a,b)} = R_a + R_b + \mathcal{O}(p^\mathrm{spacing})$. The total contribution of these configurations is therefore
 ~\\
 \textbf{Proof of claim \ref{claim:weakcancel}}: We can assume $C$ consists of a group on the left with $l$ slots and a group on the right with $r$ slots (so $r+l=|C|$), with a gap of size $k=\mathrm{gap}(C)$ between these groups. Then on the left we have strings in $\{0,1'\}^l$ as possibilities and on the right we have strings in $\{0,1'\}^r$. The combined configuration can be described by strings $f=(a,b)\in\{0,1'\}^{l+r}$. The initial probability of such a state $C(a,b)$ is $\rho_{C(a,b)} = (-1)^{|a|+|b|} p^{r+l}$ and by claim \ref{claim:expectationsum} we know $R_{C(a,b)} = R_{C(a)} + R_{C(b)} + \mathcal{O}(p^k)$ where $C(a)$ indicates that only the left slots have been filled by $a$ and the other slots are filled with $1$s. The total contribution of these configurations is therefore
 \begin{align*}
 	\sum_{a\in\{0,1'\}^l} \sum_{b\in\{0,1'\}^r} (-1)^{|a|+|b|}p^{r+l} \left( R_a + R_b \right) + \mathcal{O}(p^\mathrm{spacing})
     &= p^{r+l}\sum_{a\in\{0,1'\}^l} (-1)^{|a|} R_a \sum_{b\in\{0,1'\}^r} (-1)^{|b|} \\
     &\quad + p^{r+l}\sum_{b\in\{0,1'\}^r} (-1)^{|b|} R_b \sum_{a\in\{0,1'\}^l} (-1)^{|a|} \\
     &\quad + \mathcal{O}(p^\mathrm{spacing})\\
     &= 0 + \mathcal{O}(p^\mathrm{spacing})
     \sum_{f\in\{0,1'\}^{|C|}} \rho_{C(f)} R_{C(f)}
     &= \sum_{a\in\{0,1'\}^l} \sum_{b\in\{0,1'\}^r} (-1)^{|a|+|b|}p^{r+l} \left( R_{C(a)} + R_{C(b)} + \mathcal{O}(p^k) \right) \\
     &=\;\;\; p^{r+l}\sum_{a\in\{0,1'\}^l} (-1)^{|a|} R_{C(a)} \sum_{b\in\{0,1'\}^r} (-1)^{|b|} \\
     &\quad + p^{r+l}\sum_{b\in\{0,1'\}^r} (-1)^{|b|} R_{C(b)} \sum_{a\in\{0,1'\}^l} (-1)^{|a|}
         + \mathcal{O}(p^{r+l+k})\\
     &= 0 + \mathcal{O}(p^{|C|+k})
 \end{align*}
 where we used the identity $\sum_{a\in\{0,1'\}^l} (-1)^{|a|} = 0$.
 \newpage
     \subsection{Sketch of the (false) proof of the linear bound \ref{it:const}}
     Let us interpret $[n]$ as the vertices of a length-$n$ cycle, and interpret operations on vertices mod $n$ s.t. $n+1\equiv 1$ and $1-1\equiv n$.
     %\begin{definition}[Resample sequences]
     %	A sequence of indices $(r_\ell)=(r_1,r_2,\ldots,r_k)\in[n]^k$ is called resample sequence if our procedure performs $k$ consequtive resampling, where the first resampling of the procedure resamples around the mid point $r_1$ the second around $r_2$ and so on. Let $RS(k)$ the denote the set of length $k$ resample sequences, and let $RS=\cup_{k\in\mathbb{N}}RS(k)$.
     %\end{definition}
     %\begin{definition}[Constrained resample sequence]\label{def:constrainedRes}
     %	Let $C\subseteq[n]$ denote a slot configuration, and let $a\in\{\text{res},\neg\text{res}\}^{n-|C|}$, where the elements correspond to labels ``resampled" vs. ``not resampled" respectively.
     %	For $j\in[n-|C|]$ let $i_j$ denote the $j$-th index in $[n]\setminus C$.
     %	We define the set $A^{(C,a)}\subseteq RS$ as the set of resample sequences $(r_\ell)$ such that for all $j$ which has $a_j=\text{res}$ we have that $i_j$ appears in $(r_\ell)$ but for $j'$-s which have $a_{j'}=\neg\text{res}$ we have that $i_{j'}$ never appears in $(r_\ell)$.
     %\end{definition}
     \begin{definition}[Conditional expected number of resamples]
     	For a slot configuration $C\subseteq[n]$ and $a\in\{\!\text{ever},\text{ never}\}^{n-|C|}$ we define the event $A^{(C,a)}:=\bigwedge_{j\in[n-|C|]}\{i_j\text{ has }a_j\text{ become }0\text{ before reaching }\mathbf{1}\}$,
     	where $i_j$ is the $j$-th vertex of $[n]\setminus C$.
     	Then we also define
     	$$R^{(C,a)}_b:=\mathbb{E}[\#\{\text{resamplings when started from initial state }b\}|A^{(C,a)}].$$
     \end{definition}
     As in Mario's proof I use the observation that
     \begin{align*}
     R^{(n)}(p) &= \frac{1}{n}\sum_{b\in\{0,1,1'\}^{n}} \rho_b \; R_{\bar{b}}(p)\\
     &= \frac{1}{n}\sum_{C\subseteq [n]}\sum_{f\in\{0,1'\}^{|C|}} \rho_{C(f)} R_{C(f)}(p)\\
     &= \frac{1}{n}\sum_{C\subseteq [n]}\sum_{f\in\{0,1'\}^{|C|}}\sum_{a\in\{\!\text{ever},\text{ never}\}^{n-|C|}} \rho_{C(f)} R^{{(C,a)}}_{C(f)}(p)P_{C(f)}(A^{(C,a)})\\
     &= \frac{1}{n}\sum_{C\subseteq [n]}\sum_{a\in\{\!\text{ever},\text{ never}\}^{n-|C|}} \sum_{f\in\{0,1'\}^{|C|}} \rho_{C(f)} R^{{(C,a)}}_{C(f)}(p)P_{C(f)}(A^{(C,a)}),
     \end{align*}

0 comments (0 inline, 0 general)