Files
HonorThesis/presentation/ZheyuanWu_HonorThesis_Presentation.tex
Zheyuan Wu e6e5104de2 updates
2026-03-23 02:03:17 -05:00

672 lines
20 KiB
TeX

\documentclass[11pt]{beamer}
\usetheme{Madrid}
\usecolortheme{beaver}
\usefonttheme{serif}
\usepackage[utf8]{inputenc}
\usepackage[english]{babel}
\usepackage[T1]{fontenc}
\usepackage{amsmath}
\usepackage{amsfonts}
\usepackage{amssymb}
\usepackage{mathrsfs}
\usepackage{mathtools}
\usepackage{graphicx}
\usepackage{tabularx}
\usepackage{colortbl}
\usepackage{tikz}
\DeclareMathOperator{\sen}{sen}
\DeclareMathOperator{\tg}{tg}
\DeclareMathOperator{\obdiam}{ObsDiam}
\DeclareMathOperator{\diameter}{diam}
\setbeamertemplate{caption}[numbered]
\author[Zheyuan Wu]{Zheyuan Wu}
\title{Measure concentration in complex projective space and quantum entanglement}
\newcommand{\email}{w.zheyuan@wustl.edu}
\setbeamertemplate{navigation symbols}{}
\setbeamertemplate{footline}
{
\leavevmode%
\hbox{%
\begin{beamercolorbox}[wd=.15\paperwidth,ht=2.25ex,dp=1ex,center]{author in head/foot}%
\usebeamerfont{author in head/foot}\insertshortauthor
\end{beamercolorbox}%
\begin{beamercolorbox}[wd=.6\paperwidth,ht=2.25ex,dp=1ex,center]{title in head/foot}%
\usebeamerfont{title in head/foot}\insertsectionhead
\end{beamercolorbox}%
\begin{beamercolorbox}[wd=.15\paperwidth,ht=2.25ex,dp=1ex,center]{date in head/foot}%
\usebeamerfont{author in head/foot}\insertshortdate
\end{beamercolorbox}%
\begin{beamercolorbox}[wd=.1\paperwidth,ht=2.25ex,dp=1ex,center]{institute in head/foot}%
\insertframenumber{} / \inserttotalframenumber\hspace*{1ex}
\end{beamercolorbox}}%
\vskip0pt%
}
\setbeamercolor{block title}{fg=white, bg=red!50!black!60}
\setbeamercolor{block body}{fg=black, bg=red!5}
\setbeamercolor{item}{fg=red!60!black}
\setbeamercolor{section number projected}{fg=white, bg=red!70!black}
\institute[]{Washington University in St. Louis}
\date{\today}
\begin{document}
\begin{frame}
\titlepage
\end{frame}
\begin{frame}{Table of Contents}
\hypersetup{linkcolor=black}
\tableofcontents
\end{frame}
\section{Motivation}
\begin{frame}{Light polarization and non-commutative probability}
\begin{figure}
\includegraphics[width=0.6\textwidth]{../latex/images/Filter_figure.png}
\end{figure}
\begin{itemize}
\item Light passing through a polarizer becomes polarized in the direction of that filter.
\item If two filters are placed with relative angle $\alpha$, the transmitted intensity decreases as $\alpha$ increases.
\item In particular, the transmitted intensity vanishes when $\alpha=\pi/2$.
\end{itemize}
\end{frame}
\begin{frame}{Polarization experiment}
\vspace{0.5em}
Now consider three filters $F_1,F_2,F_3$ with directions
$$
\alpha_1,\alpha_2,\alpha_3.
$$
Testing them pairwise suggests introducing three $0$--$1$ random variables
$$
P_1,P_2,P_3,
$$
where $P_i=1$ means that the photon passes filter $F_i$.
\vspace{0.5em}
If these were classical random variables on one probability space, they would satisfy a Bell-type inequality.
\end{frame}
\begin{frame}{A classical Bell-type inequality}
\begin{block}{Bell-type inequality}
For any classical random variables $P_1,P_2,P_3\in\{0,1\}$,
$$
\operatorname{Prob}(P_1=1,P_3=0)
\leq
\operatorname{Prob}(P_1=1,P_2=0)
+
\operatorname{Prob}(P_2=1,P_3=0).
$$
\end{block}
\vspace{0.5em}
\begin{proof}
The event $\{P_1=1,P_3=0\}$ splits into two disjoint cases according to whether $P_2=0$ or $P_2=1$:
$$
\{P_1=1,P_3=0\}
=
\{P_1=1,P_2=0,P_3=0\}
\sqcup
\{P_1=1,P_2=1,P_3=0\}.
$$
Therefore,
$$
\begin{aligned}
\operatorname{Prob}(P_1=1,P_3=0)
&=
\operatorname{Prob}(P_1=1,P_2=0,P_3=0) \\
&\quad+
\operatorname{Prob}(P_1=1,P_2=1,P_3=0) \\
&\leq
\operatorname{Prob}(P_1=1,P_2=0)
+
\operatorname{Prob}(P_2=1,P_3=0).
\end{aligned}
$$
\end{proof}
\end{frame}
\begin{frame}{Experimental law}
For unpolarized incoming light, the \textbf{observed transition law} for a pair of filters is
$$
\operatorname{Prob}(P_i=1,P_j=0)
=
\operatorname{Prob}(P_i=1)-\operatorname{Prob}(P_i=1,P_j=1).
$$
Using the polarization law,
$$
\operatorname{Prob}(P_i=1)=\frac12,
\qquad
\operatorname{Prob}(P_i=1,P_j=1)=\frac12\cos^2(\alpha_i-\alpha_j),
$$
hence
$$
\operatorname{Prob}(P_i=1,P_j=0)
=
\frac12-\frac12\cos^2(\alpha_i-\alpha_j)
=
\frac12\sin^2(\alpha_i-\alpha_j).
$$
\vspace{0.5em}
So the experimentally observed probabilities depend only on the angle difference $\alpha_i-\alpha_j$.
\end{frame}
\begin{frame}{Violation of the classical inequality}
Substituting the experimental law into the classical inequality gives
$$
\frac12\sin^2(\alpha_1-\alpha_3)
\leq
\frac12\sin^2(\alpha_1-\alpha_2)
+
\frac12\sin^2(\alpha_2-\alpha_3).
$$
Choose
$$
\alpha_1=0,\qquad
\alpha_2=\frac{\pi}{6},\qquad
\alpha_3=\frac{\pi}{3}.
$$
Then
$$
\begin{aligned}
\frac12\sin^2\!\left(-\frac{\pi}{3}\right)
&\leq
\frac12\sin^2\!\left(-\frac{\pi}{6}\right)
+
\frac12\sin^2\!\left(-\frac{\pi}{6}\right) \\
\frac38 &\leq \frac18+\frac18 \\
\frac38 &\leq \frac14,
\end{aligned}
$$
which is false.
\vspace{0.5em}
Therefore the pairwise polarization data cannot come from one classical probability model with random variables $P_1,P_2,P_3$.
\end{frame}
\begin{frame}{The quantum model of polarization}
The correct model uses a Hilbert space rather than classical events.
\begin{itemize}
\item A pure polarization state is a vector
$$
\psi=\alpha|0\rangle+\beta|1\rangle \in \mathbb{C}^2.
$$
\item A filter at angle $\alpha$ is represented by the orthogonal projection
$$
P_\alpha=
\begin{pmatrix}
\cos^2\alpha & \cos\alpha\sin\alpha \\
\cos\alpha\sin\alpha & \sin^2\alpha
\end{pmatrix}.
$$
\item For a pure state $\psi$, the probability of passing the filter is
$$
\langle P_\alpha\psi,\psi\rangle.
$$
\end{itemize}
\vspace{0.4em}
The key point is that sequential measurements are described by \emph{ordered products} of projections, and these need not commute.
\end{frame}
\begin{frame}{Recovering the observed law from the operator model}
Assume the incoming light is unpolarized, so its state is the density matrix
$$
\rho=\frac12 I.
$$
The probability of passing the first filter $P_{\alpha_i}$ is
$$
\operatorname{Prob}(P_i=1)
=
\operatorname{tr}(\rho P_{\alpha_i})
=
\frac12\operatorname{tr}(P_{\alpha_i})
=
\frac12.
$$
If the photon passes the first filter, the post-measurement state is
$$
\rho_i
=
\frac{P_{\alpha_i}\rho P_{\alpha_i}}{\operatorname{tr}(\rho P_{\alpha_i})}
=
P_{\alpha_i}.
$$
$$
P_\alpha=
\begin{pmatrix}
\cos^2\alpha & \cos\alpha\sin\alpha \\
\cos\alpha\sin\alpha & \sin^2\alpha
\end{pmatrix}.
$$
Therefore
$$
\operatorname{Prob}(P_j=1\mid P_i=1)
=
\operatorname{tr}(\rho_i P_{\alpha_j})
=
\operatorname{tr}(P_{\alpha_i}P_{\alpha_j})
=
\cos^2(\alpha_i-\alpha_j).
$$
\end{frame}
\begin{frame}{Recovering the observed law from the operator model (cont.)}
$$
\begin{aligned}
\operatorname{Prob}(P_i=1,P_j=0)
&=
\operatorname{Prob}(P_i=1)
\bigl(1-\operatorname{Prob}(P_j=1\mid P_i=1)\bigr) \\
&=
\frac12\bigl(1-\cos^2(\alpha_i-\alpha_j)\bigr) \\
&=
\frac12\sin^2(\alpha_i-\alpha_j).
\end{aligned}
$$
This matches the experiment exactly.
\end{frame}
\begin{frame}{Conclusion}
\begin{itemize}
\item The classical model predicts a Bell-type inequality for three $0$--$1$ random variables.
\item The polarization experiment violates that inequality.
\item The resolution is that the quantities measured are \emph{sequential probabilities}, not joint probabilities of classical random variables.
\item In quantum probability, events are modeled by projections on a Hilbert space, and measurement order matters.
\end{itemize}
\vspace{0.6em}
This is one of the basic motivations for passing from classical probability to non-commutative probability.
\end{frame}
\section{Concentration on Spheres and quantum states}
\begin{frame}{Quantum states: pure vs.\ mixed}
\begin{itemize}
\item A finite-dimensional quantum system is modeled by a complex Hilbert space (a complete inner product space)
$$
\mathcal H \cong \mathbb C^{n+1}.
$$
\item A \textbf{pure state} is represented by a unit vector
$$
\psi \in \mathcal H, \qquad \|\psi\|=1.
$$
\item A \textbf{mixed state} is represented by a density matrix
$$
\rho \geq 0, \qquad \operatorname{tr}(\rho)=1.
$$
\item Pure states describe maximal information; mixed states describe probabilistic mixtures or partial information.
\end{itemize}
\vspace{0.4em}
\begin{block}{Key distinction}
Pure states form a curved geometric space; mixed states form a convex set inside the space of matrices.
\end{block}
\end{frame}
\begin{frame}{Why pure states are not vectors}
\begin{itemize}
\item Two nonzero vectors that differ by a nonzero complex scalar represent the same physical state:
$$
\psi \sim \lambda \psi, \qquad \lambda \in \mathbb C^\times.
$$
\item In particular, multiplying by a phase $e^{i\theta}$ does not change any physical predictions.
\item Therefore the physical pure state is not a single vector, but the \emph{complex line} spanned by that vector.
\end{itemize}
\vspace{0.4em}
Hence the space of pure states is
$$
\mathbb P(\mathcal H)
=
(\mathcal H \setminus \{0\})/\mathbb C^\times.
$$
After choosing a basis $\mathcal H \cong \mathbb C^{n+1}$, this becomes
$$
\mathbb P(\mathcal H) \cong \mathbb C P^n.
$$
\end{frame}
\begin{frame}{Relation with the sphere}
\begin{itemize}
\item Every nonzero vector can be normalized, so each pure state has a representative on the unit sphere
$$
S^{2n+1} \subset \mathbb C^{n+1}.
$$
\item Two unit vectors represent the same pure state exactly when they differ by a phase:
$$
z \sim e^{i\theta} z.
$$
\item Therefore
$$
\mathbb C P^n = S^{2n+1}/S^1.
$$
\end{itemize}
\vspace{0.4em}
The quotient map
$$
p:S^{2n+1}\to \mathbb C P^n, \qquad p(z)=[z]=\{\lambda z : \lambda \in \mathbb C^\times\},
$$
is the \textbf{Hopf fibration}.
\end{frame}
\begin{frame}{How the metric descends to $\mathbb C P^n$}
\begin{itemize}
\item The sphere $S^{2n+1}$ inherits the round metric from the Euclidean metric on
$$
\mathbb C^{n+1} \cong \mathbb R^{2n+2}.
$$
\item The fibers of the Hopf map are circles
$$
p^{-1}([z]) = \{e^{i\theta}z : \theta \in \mathbb R\}.
$$
\item Tangent vectors split into:
\begin{itemize}
\item \textbf{vertical directions}: tangent to the $S^1$-fiber,
\item \textbf{horizontal directions}: orthogonal complement to the fiber.
\end{itemize}
\item The differential $dp$ identifies horizontal vectors on the sphere with tangent vectors on $\mathbb C P^n$.
\end{itemize}
\vspace{0.4em}
This allows the round metric on $S^{2n+1}$ to define a metric on $\mathbb C P^n$.
\end{frame}
\begin{frame}{The induced metric: Fubini--Study metric}
\begin{itemize}
\item The metric on $\mathbb C P^n$ obtained from the Hopf quotient is the
\textbf{Fubini--Study metric}.
\item So the geometric picture is:
$$
S^{2n+1}
\xrightarrow{\text{Hopf fibration}}
\mathbb C P^n
$$
$$
\text{round metric}
\rightsquigarrow
\text{Fubini--Study metric}.
$$
\item The normalized Riemannian volume measure induced by this metric gives the natural probability measure on pure states.
\end{itemize}
\vspace{0.5em}
\begin{block}{Proof roadmap}
To prove this carefully, one usually shows:
\begin{enumerate}
\item $p:S^{2n+1}\to \mathbb C P^n$ is a smooth surjective submersion,
\item the vertical space is the tangent space to the $S^1$-orbit,
\item horizontal lifts are well defined,
\item the quotient metric is exactly the Fubini--Study metric.
\end{enumerate}
\end{block}
\end{frame}
\begin{frame}{Maxwell-Boltzmann Distribution Law}
\begin{columns}[T]
\column{0.58\textwidth}
Consider the orthogonal projection
$$
\pi_{n,k}:S^n(\sqrt{n})\to \mathbb{R}^k.
$$
Its push-forward measure converges to the standard Gaussian:
$$
(\pi_{n,k})_*\sigma^n\to \gamma^k.
$$
\vspace{0.5em}
This explains why Gaussian behavior emerges from high-dimensional spheres and supports the proof strategy for Levy concentration.
\column{0.42\textwidth}
\begin{figure}
\includegraphics[width=\textwidth]{../latex/images/maxwell.png}
\end{figure}
\end{columns}
\end{frame}
\begin{frame}{Levy Concentration}
\begin{block}{Levy's theorem}
If $f:S^n\to \mathbb{R}$ is $1$-Lipschitz, then there exists a median $a_0$ such that
$$
\mu\{x\in S^n:|f(x)-a_0|\geq \epsilon\}
\leq
2\exp\left(-\frac{(n-1)\epsilon^2}{2}\right).
$$
\end{block}
\begin{itemize}
\item In high dimension, most Lipschitz observables are almost constant.
\item This is the geometric mechanism behind generic entanglement.
\end{itemize}
\end{frame}
\section{Main Result}
\begin{frame}{Generic Entanglement Theorem}
\begin{block}{Hayden--Leung--Winter}
Let $\psi\in \mathcal{P}(A\otimes B)$ be Haar-random and define
$$
\beta=\frac{1}{\ln(2)}\frac{d_A}{d_B}.
$$
For $d_B\geq d_A\geq 3$,
$$
\operatorname{Pr}[H(\psi_A)<\log_2(d_A)-\alpha-\beta]
\leq
\exp\left(
-\frac{1}{8\pi^2\ln(2)}
\frac{(d_Ad_B-1)\alpha^2}{(\log_2 d_A)^2}
\right).
$$
\end{block}
With overwhelming probability, a random pure state is almost maximally entangled.
\end{frame}
\begin{frame}{How the Entropy Observable Fits In}
\begin{figure}
\centering
\begin{tikzpicture}[node distance=30mm, thick,
main/.style={draw, draw=white},
towards/.style={->},
towards_imp/.style={->,red},
mutual/.style={<->}
]
\node[main] (cp) {$\mathbb{C}P^{d_A d_B-1}$};
\node[main] (pa) [left of=cp] {$\mathcal{P}(A\otimes B)$};
\node[main] (sa) [below of=pa] {$\mathcal{S}(A)$};
\node[main] (rng) [right of=sa] {$[0,\log_2 d_A]$};
\draw[mutual] (cp) -- (pa);
\draw[towards] (pa) -- node[left] {$\operatorname{Tr}_B$} (sa);
\draw[towards_imp] (pa) -- node[above right] {$\psi\mapsto H(\psi_A)$} (rng);
\draw[towards] (sa) -- node[above] {$H$} (rng);
\end{tikzpicture}
\end{figure}
\begin{itemize}
\item The red arrow is the observable to which concentration is applied.
\item The projective description is natural because global phase does not change the physical state.
\end{itemize}
\end{frame}
\begin{frame}{Ingredients Behind the Tail Bound}
\begin{block}{Page-type lower bound}
$$
\mathbb{E}[H(\psi_A)]
\geq
\log_2(d_A)-\frac{1}{2\ln(2)}\frac{d_A}{d_B}.
$$
\end{block}
\begin{block}{Lipschitz estimate}
$$
\|H(\psi_A)\|_{\mathrm{Lip}}
\leq
\sqrt{8}\,\log_2(d_A),
\qquad d_A\geq 3.
$$
\end{block}
Levy concentration plus these two estimates produces the exponential entropy tail bound.
\end{frame}
\section{Geometry of State Space}
\begin{frame}{Observable diameter: the inner definition}
\begin{block}{Partial diameter on $\mathbb{R}$}
Let $\nu$ be a Borel probability measure on $\mathbb{R}$ and let $\alpha \in (0,1]$.
The \textbf{partial diameter} of $\nu$ at mass level $\alpha$ is
$$
\diameter(\nu;\alpha):=
\{\diameter(A):A \subseteq \mathcal{B}(\mathbb{R}),
\nu(A)\ge \alpha
\},
$$
where
$$
\diameter(A):=\sup_{x,y\in A}|x-y|.
$$
\end{block}
\vspace{0.4em}
\begin{itemize}
\item This asks for the shortest interval-like region containing at least $\alpha$ of the total mass.
\item So $\diameter(\nu;1-\kappa)$ measures how tightly we can capture \emph{most} of the distribution, allowing us to discard a set of mass at most $\kappa$.
\end{itemize}
\end{frame}
\begin{frame}{Observable diameter of a metric-measure space}
\begin{block}{Definition}
Let $X=(X,d_X,\mu_X)$ be a metric-measure space and let $\kappa>0$.
The \textbf{observable diameter} of $X$ is
$$
\obdiam_{\mathbb{R}}(X;-\kappa)
:=
\sup_{f\in \operatorname{Lip}_1(X,\mathbb{R})}
\diameter(f_*\mu_X;1-\kappa),
$$
where $\operatorname{Lip}_1(X,\mathbb{R})$ is the set of all $1$-Lipschitz functions
$f:X\to\mathbb{R}$, and $f_*\mu_X$ is the pushforward measure on $\mathbb{R}$.
\end{block}
\vspace{0.4em}
\begin{itemize}
\item Each $1$-Lipschitz function $f$ is viewed as an \textbf{observable} on $X$.
\item The pushforward measure $f_*\mu_X$ is the distribution of the values of that observable.
\item If $\obdiam_{\mathbb{R}}(X;-\kappa)$ is small, then \emph{every} $1$-Lipschitz observable is strongly concentrated.
\end{itemize}
\end{frame}
\begin{frame}{A Geometric Consequence}
In this thesis, entropy functions are used as concrete observables to estimate observable diameter, and the Hopf fibration helps transfer information between $S^{2n+1}$ and $\mathbb{C}P^n$.
\vspace{0.4em}
\begin{block}{Projective-space estimate}
For $0<\kappa<1$,
$$
\obdiam(\mathbb{C}P^n(1);-\kappa)\leq O(\sqrt{n}).
$$
\end{block}
\begin{itemize}
\item First estimate observable diameter on spheres via Gaussian limits.
\item Then use the Hopf map $S^{2n+1}(1)\to \mathbb{C}P^n$.
\item This gives a geometric explanation for why many projective-space observables concentrate.
\end{itemize}
\end{frame}
\section{Numerical Section}
\begin{frame}{Entropy-Based Simulations}
\begin{itemize}
\item Sample Haar-random pure states in $\mathbb{C}^{d_A}\otimes\mathbb{C}^{d_B}$.
\item Compute reduced density matrices and entanglement entropy.
\item Measure shortest intervals containing mass $1-\kappa$ in the entropy distribution.
\item Compare concentration across:
\begin{itemize}
\item real spheres,
\item complex projective spaces,
\item symmetric states via Majorana stellar representation.
\end{itemize}
\end{itemize}
\end{frame}
\begin{frame}{What the Data Suggests}
\begin{columns}[T]
\column{0.5\textwidth}
\begin{figure}
\includegraphics[width=\textwidth]{../latex/images/entropy_vs_dim.png}
\end{figure}
\centering
Entropy vs.\ ambient dimension
\column{0.5\textwidth}
\begin{figure}
\includegraphics[width=\textwidth]{../latex/images/entropy_vs_dA.png}
\end{figure}
\centering
Entropy vs.\ subsystem dimension
\end{columns}
\vspace{0.6em}
As dimension increases, the entropy distribution concentrates near the maximal value.
\end{frame}
\section{Conclusion}
\begin{frame}{Conclusion and Outlook}
\begin{itemize}
\item Concentration of measure explains generic high entanglement in large bipartite systems.
\item Complex projective space provides the natural geometric setting for pure quantum states.
\item Observable diameter gives a way to phrase concentration geometrically.
\item Ongoing directions:
\begin{itemize}
\item sharper estimates for $\mathbb{C}P^n$,
\item deeper use of Fubini--Study geometry,
\item Majorana stellar representation for symmetric states.
\end{itemize}
\end{itemize}
\end{frame}
\section{References}
\begin{frame}[allowframebreaks]{References}
\nocite{*}
\bibliographystyle{apalike}
\bibliography{references}
\end{frame}
\begin{frame}
\begin{center}
Q\&A
\end{center}
\end{frame}
\end{document}