recce.ltx

% Copyright 2015 Jeffrey Kegler
% This document is licensed under
% a Creative Commons Attribution-NoDerivs 3.0 United States License.
\documentclass[12pt,openany,twoside]{amsbook}
% \RequirePackage[l2tabu, orthodox]{nag}
\usepackage{microtype}
\usepackage{ragged2e}
\usepackage{mathtools}
\usepackage{tikz-cd}
\usepackage{tikz-qtree}
\usetikzlibrary{decorations.pathmorphing}
\usepackage{amssymb}
\usepackage{amsmidx}
\usepackage{url}
\usepackage{amsfonts}% to get the \mathbb alphabet
\usepackage{float}
\floatstyle{boxed}
\restylefloat{figure}
% \usepackage[columns=1]{idxlayout}
\usepackage[pdfpagelabels]{hyperref}
\usepackage{algpseudocode}
\usepackage{algorithm}

\allowdisplaybreaks

% In "Writing a thesis with LATEX", Lapo F. Mori
% says anything but '[tb]' and '[p]' for floats
% is counterproductive.  I switched over based on
% his suggestion, and he's absolutely right.

% for escaping in index commands ...
%    the quote sign does not seem to work in amsmidx
% \Pipe typesets a literal vertical bar by character code, so that no
% bare `|' has to appear inside an index entry.  The character constant
% must be introduced by an ASCII backtick (`\|); a typographic quote
% is not accepted by TeX's number scanner.
\newcommand{\Pipe}{\char`\|}
% Declare the separate indexes.  Every \index{<index>}{<entry>} call in
% this file names one of these as its first argument.  The figures
% index is currently disabled.
\makeindex{recce-general}
\makeindex{recce-algorithms}
% \makeindex{recce-figures}
\makeindex{recce-theorems}
\makeindex{recce-definitions}
\makeindex{recce-notation}

% This is used to find the font size if need be
% its uses are usually commented out
% \thefontsize{<setup>}: inside a group, emits <setup> and then a
% one-paragraph message reporting \f@size.  <setup> is presumably a font
% size switch such as \small -- confirm against callers.  \f@size has an
% `@' in its name, hence the \makeatletter/\makeatother pair.
\makeatletter
\newcommand\thefontsize[1]{{#1 The current font size is: \f@size pt\par}}
\makeatother

% \DeclareMathSizes{6}{6}{6}{6}
% \DeclareMathSizes{8}{8}{8}{8}
% \DeclareMathSizes{10}{10}{10}{10}
% \DeclareMathSizes{10.95}{10.95}{10.95}{10.95}
% \DeclareMathSizes{12}{12}{12}{12}
% \DeclareMathSizes{14.4}{14.4}{14.4}{14.4}
% \DeclareMathSizes{20.74}{20.74}{20.74}{20.74}
% \DeclareMathSizes{24.88}{24.88}{24.88}{24.88}

% \mysee{<target>}{<ignored>}: prints "see <target>" with "see"
% emphasized; the second argument is discarded.
\newcommand{\mysee}[2]{\emph{see} #1}
% \myixentry{<text>}{<ignored>}: prints only its first argument.
\newcommand{\myixentry}[2]{#1}

% \newcommand{\todo}[1]{\par{\large\textbf Todo: #1}\par}

% I use multi-character variable names, and TeX's usual math italic
% does not work well for them.  Rather than get into changing the
% default math font, I use a special macro for variables.
% It also allows me to use hyphens in variable names.
% \var{<name>}: sets <name> in typewriter.  The \ensuremath wrapper
% makes the macro usable in both text and math mode.
\newcommand{\var}[1]{\ensuremath{\texttt{#1}}}

% Many of the macros have two forms --
% '\xyz' and '\Vxyz'.  The \Vxyz is the same
% as the \xyz form, except that it typesets its
% argument as a math variable in the style of this
% monograph.

% Function and operator names are set in typewriter, exactly like \var.
\newcommand{\myfnname}[1]{\ensuremath{\texttt{#1}}}
\newcommand{\myopname}[1]{\ensuremath{\texttt{#1}}}
% \myfn{<name>}{<args>}: function application, typeset as name(args).
\newcommand{\myfn}[2]{\ensuremath{\myfnname{#1}(#2)}}

% \vat{a}{b} and \vatp{a}{b}{c}: applications v(a,b) and v(a,b,c) of
% the function named "v".
\newcommand{\vat}[2]{\ensuremath{\myfnname{v}(#1,#2)}}
\newcommand{\vatp}[3]{\ensuremath{\myfnname{v}(#1,#2,#3)}}

% definitions for "elements" -- x[i]
% \el{<name>}{<index>}: <name> in typewriter followed by [<index>].
% \Vel is the same, with the index wrapped in \var.
\newcommand{\el}[2]{\ensuremath{\texttt{#1}[#2]}}
\newcommand{\Vel}[2]{\el{#1}{\var{#2}}}

% definitions for "operators" -- x(a, ...)
% \op{<name>}{<args>}: <name> in typewriter followed by (<args>).
\newcommand{\op}[2]{\ensuremath{\texttt{#1}(#2)}}
% \iop{<name>}{<n>}{<args>}: iterated application; <n> is set as a
% superscript in \displaystyle, i.e. at full size rather than script size.
\newcommand{\iop}[3]{\ensuremath{
  \myfnname{#1}^{\displaystyle #2}(#3)
}}
% \bigop: like \op, but with \big-sized parentheses.
\newcommand{\bigop}[2]{\ensuremath{\texttt{#1}\big(#2\big)}}
% \Vop: like \op, with the whole argument wrapped in \var.
\newcommand{\Vop}[2]{\op{#1}{\var{#2}}}

% For a type name, when it occurs in text
% (the name is set as ordinary math material via \ensuremath)
\newcommand{\type}[1]{\ensuremath{#1}}
% For defining a type
% \dtype{<T>} prints the type like \type and writes two index entries:
% "<T> (type)" in the definitions index, and, in the notation index,
% an entry sorted under <T> that shows the variable x subscripted with <T>.
\newcommand{\dtype}[1]{\type{#1}%
  \index{recce-definitions}{#1 (type)}%
  \index{recce-notation}{#1@\ensuremath{\var{x}_{#1}} (#1 type)}%
}

% \defined: "is defined as" relation -- \equiv with "def" set underneath.
\newcommand{\defined}{\mathrel{\underset{\text{def}}{\equiv}}}
% \xdfn{<text>}{<index entry>}: prints <text> in bold and files
% <index entry> in the definitions index.
% \dfn{<text>}: \xdfn with the printed text reused as the index entry.
% \qdfn{<text>}: bold only, no index entry.
\newcommand{\xdfn}[2]{\textbf{#1}\index{recce-definitions}{#2}}
\newcommand{\dfn}[1]{\xdfn{#1}{#1}}
\newcommand{\qdfn}[1]{{\textbf{#1}}}
% \sep: a thin-spaced \mid.  \mydot: a slightly raised, thin-spaced bullet.
\newcommand{\sep}{\,\mid\,}
\newcommand{\mydot}{\raisebox{.05em}{$\,\bullet\,$}}
% Concatenation: \cat expands to nothing (implicit concatenation);
% \Cat is the explicit form, a thin-spaced period.
\newcommand{\cat}{}
\newcommand{\Cat}{\,.\,}
% \size: |x| with auto-sized bars; \bigsize: the same with \big-sized bars.
\newcommand{\size}[1]{\ensuremath{\left | {#1} \right |}}
\newcommand{\bigsize}[1]{\ensuremath{\bigl| {#1} \bigr|}}
% \order{<x>}: calligraphic O applied to <x>.  \Oc is O(1).
% \On is O(n); \On[<k>] is O(n^<k>).
% NOTE(review): \ifthenelse comes from the ifthen package, which this
% file does not load explicitly -- presumably it arrives via another
% package; confirm.
\newcommand{\order}[1]{\ensuremath{{\mathcal O}(#1)}}
\newcommand{\Oc}{\order{1}}
\newcommand{\On}[1][]{%
  \ifthenelse{\equal{#1}{}}%
    {\ensuremath{\order{\var{n}}}}%
    {\ensuremath{\order{\var{n}^{#1}}}}%
}
\newcommand{\LRk}{\ensuremath{\var{LR}(\var{k})}}
% \inference{<above>}{<below>}: <above> over <below>, separated by a
% 1pt rule, with no delimiters.
\newcommand{\inference}[2]{\genfrac{}{}{1pt}{}{#1}{#2}}

% \undefined: the \perp symbol, classed as an ordinary math atom.
\newcommand{\undefined}{\ensuremath{\mathord{\perp}}}

% I use hyphens in variable names,
% so I need to ensure that subtraction is
% clearly distinguished by the typography
% \subtract is a minus sign with a thin space on each side; the empty
% group {} gives the minus a left-hand operand.
\newcommand{\subtract}{\,{}-\,}
% \xxsubtract{<a>}{<b>}: <a> minus <b> with the same spacing.
\newcommand{\xxsubtract}[2]{\ensuremath{#1\,{}-\,#2}}
% \decr{<x>} is <x> - 1 and \incr{<x>} is <x> + 1; the V-forms wrap
% their argument in \var.
\newcommand{\decr}[1]{\xxsubtract{#1}{1}}
\newcommand{\Vdecr}[1]{\decr{\var{#1}}}
\newcommand{\incr}[1]{\ensuremath{#1 + 1}}
\newcommand{\Vincr}[1]{\incr{\var{#1}}}

% Grammar and derivation relations.
% \de is the rule-definition sign "::="; \derives is a single
% derivation step, drawn with \mapsto.
\newcommand{\de}{\mathrel{::=}}
\newcommand{\derives}{\mapsto}
% \nderives{<label>}: negated derivation.  With an empty argument it is
% a plain \not\mapsto; otherwise <label> is stacked over the negated arrow.
\newcommand{\nderives}[1]{
\mathrel{%
  \ifthenelse{\equal{#1}{}}{%
    {\not\mapsto}%
  }{%
    {\mbox{$\:\stackrel{\!{#1}}{\not\mapsto\!}\:$}}%
  }%
}}%
% \xderives{<label>}: derivation arrow with <label> stacked on top.
\newcommand{\xderives}[1]
    {\mathrel{\mbox{$\:\stackrel{\!{#1}}{\mapsto\!}\:$}}}
% \destar / \deplus: the arrow labelled with * and with +;
% \ndestar / \ndeplus are their negations.
\newcommand{\destar}
    {\mathrel{\mbox{$\:\stackrel{\!{\ast}}{\mapsto\!}\:$}}}
\newcommand{\ndestar}{\nderives{\ast}}
\newcommand{\deplus}
    {\mathrel{\mbox{$\:\stackrel{\!{+}}{\mapsto\!}\:$}}}
\newcommand{\ndeplus}{\nderives{+}}
% NOTE(review): \derivg takes one argument and \derivrg takes two, but
% \derivg's argument and \derivrg's second argument are not used in the
% output.  Presumably a grammar argument that is deliberately not
% typeset -- confirm.
\newcommand{\derivg}[1]{\mathrel{\mbox{$\:\mapsto\:$}}}
\newcommand{\derivrg}[2]{\mathrel{\mbox{$\:\stackrel{\!{#1}}%
        {\mapsto\!}\:$}}}
% \drv{<name>}{<i>}{<j>}: <name> in typewriter with two bracketed
% indexes; \drvVV wraps both indexes in \var.
\newcommand{\drv}[3]{\ensuremath{\texttt{#1}[#2][#3]}}
\newcommand{\drvVV}[3]{\drv{#1}{\var{#2}}{\var{#3}}}
% \newcommand{\lblarrow}[1]
    % {\mathrel{\mbox{$\:\stackrel{\!{#1}}{\mapsto\!}\:$}}}

% Set braces at three sizes: auto-sized (\set), \big and \Big.
% Each expansion starts with a brace group.
\newcommand{\set}[1]{{\left\lbrace #1 \right\rbrace} }
\newcommand{\bigset}[1]{{\bigl\lbrace #1 \bigr\rbrace} }
\newcommand{\Bigset}[1]{{\Bigl\lbrace #1 \Bigr\rbrace} }
% Type-subscript macros.  The lower-case forms attach a type name as a
% subscript to their argument; the V-forms first wrap the argument in
% \var; the "...set" forms put the type name inside set braces.
% Forms without \ensuremath use a bare `_' and so need math mode.
\newcommand{\dr}[1]{#1_{DR}}
\newcommand{\Vdr}[1]{\ensuremath{\var{#1}_{DR}}}
\newcommand{\Vdrset}[1]{\ensuremath{\var{#1}_{\set{DR}}}}
\newcommand{\eim}[1]{#1_{EIM}}
\newcommand{\Veim}[1]{\ensuremath{\var{#1}_{EIM}}}
\newcommand{\Veimset}[1]{\ensuremath{\var{#1}_{\set{EIM}}}}
\newcommand{\leo}[1]{#1_{LEO}}
\newcommand{\Vleo}[1]{\ensuremath{\var{#1}_{LEO}}}
\newcommand{\inst}[1]{#1_{INST}}
\newcommand{\Vinst}[1]{\ensuremath{\var{#1}_{INST}}}
\newcommand{\Ees}[1]{\ensuremath{#1_{ES}}}
\newcommand{\loc}[1]{\ensuremath{{#1}_{LOC}}}
\newcommand{\Vloc}[1]{\loc{\var{#1}}}
\newcommand{\Ves}[1]{\Ees{\var{#1}}}
\newcommand{\Vrule}[1]{\ensuremath{\var{#1}_{RULE}}}
\newcommand{\Vruleset}[1]{\ensuremath{\var{#1}_{\set{RULE}}}}
\newcommand{\Vsize}[1]{\ensuremath{\size{\var{#1}}}}
% Strings and symbols: \str and \sym use subscripts, but \Vstr and
% \Vsym use angle brackets instead -- double for a string variable,
% single for a symbol variable.
\newcommand{\str}[1]{\ensuremath{#1_{STR}}}
\newcommand{\Vstr}[1]{\ensuremath{\langle\langle\var{#1}\rangle\rangle}}
\newcommand{\sym}[1]{\ensuremath{#1_{SYM}}}
\newcommand{\Vsym}[1]{\ensuremath{\langle\var{#1}\rangle}}
\newcommand{\Vorig}[1]{\ensuremath{\var{#1}_{ORIG}}}
\newcommand{\symset}[1]{#1_{\lbrace SYM \rbrace} }
\newcommand{\Vsymset}[1]{\ensuremath{\var{#1}_{\set{SYM}}}}
\newcommand{\term}[1]{#1_{TERM}}
% \mk{<x>}: <x> between \lfloor and \rceil.  \bigmk uses \big-sized
% delimiters and has no \ensuremath, so it needs math mode.
\newcommand{\mk}[1]{\ensuremath{\lfloor#1\rceil}}
\newcommand{\bigmk}[1]{\big\lfloor#1\big\rceil}
% \mkdelim is the separator placed beside a marker; it is currently
% empty (the spaced variant is commented out).  \mkr puts it before the
% marker, \mkl after it, \mkm on both sides; the V-forms wrap the
% argument in \var.
% \newcommand{\mkdelim}{\,\,}
\newcommand{\mkdelim}{}
\newcommand{\mkr}[1]{\mkdelim \mk{#1}}
\newcommand{\mkl}[1]{\mk{#1} \mkdelim}
\newcommand{\mkm}[1]{\mkdelim \mk{#1} \mkdelim}
\newcommand{\Vmk}[1]{\mk{\var{#1}}}
\newcommand{\Vmkl}[1]{\Vmk{#1} \mkdelim}
\newcommand{\Vmkr}[1]{\mkdelim \Vmk{#1}}
\newcommand{\Vmkm}[1]{\mkdelim \Vmk{#1} \mkdelim}

% \lastix{<x>}: a hash sign, scaled to 80% and raised 0.4ex, prefixed
% to <x>.  \Vlastix wraps the argument in \var.
% NOTE(review): \scalebox is a graphicx command and graphicx is not
% loaded explicitly in this file -- presumably it arrives via the TikZ
% packages; confirm.
\newcommand{\lastix}[1]{\ensuremath{
% I want a hash sign to be a 'last index' operator, but
% the regular hash sign is ungainly and not resizeable.
% This tames it a bit.
  {\protect\scalebox{0.8}{\protect\raisebox{0.4ex}{\#}}{#1}}
}}
\newcommand{\Vlastix}[1]{\lastix{\var{#1}}}

% \alg{<name>}: an algorithm name, set in small caps.  The three
% algorithm names used in this document follow.
\newcommand{\alg}[1]{\ensuremath{\textsc{#1}}}
\newcommand{\Earley}{\ensuremath{\alg{Earley}}}
\newcommand{\Leo}{\ensuremath{\alg{Leo}}}
\newcommand{\Marpa}{\ensuremath{\alg{Marpa}}}

% Named functions and constants of the monograph.
% Each one-argument macro \Foo{<x>} typesets Foo(<x>) with the name in
% typewriter (\myfnname); \PSL{<i>}{<j>} typesets PSL[<i>][<j>];
% \Maxleosilo takes two comma-separated arguments.  The \C... macros
% are fixed variable names.
% Every macro is wrapped in \ensuremath (directly or through \var), so
% the whole expression -- not only the function name -- is set as math
% whether the macro is used in text or in math mode.  In math mode
% \ensuremath is a no-op, so existing math-mode uses are unaffected.
\newcommand{\Alt}[1]{\ensuremath{\myfnname{Alt}(#1)}}
\newcommand{\Cdr}{\var{dr}}
\newcommand{\Cg}{\var{g}}
\newcommand{\Crules}{\var{rules}}
\newcommand{\Current}[1]{\ensuremath{\myfnname{Current}(#1)}}
\newcommand{\CVw}[1]{\ensuremath{\sym{\Cw[\var{#1}]}}}
\newcommand{\CW}{\ensuremath{\mathbb W}}
\newcommand{\Cw}{\var{w}}
\newcommand{\Dotix}[1]{\ensuremath{\myfnname{Dotix}(#1)}}
\newcommand{\DR}[1]{\ensuremath{\myfnname{DR}(#1)}}
\newcommand{\GOTO}{\ensuremath{\myfnname{GOTO}}}
\newcommand{\ID}[1]{\ensuremath{\myfnname{ID}(#1)}}
\newcommand{\Layer}[1]{\ensuremath{\myfnname{Layer}(#1)}}
\newcommand{\Leosilo}[1]{\ensuremath{\myfnname{Leo-silo}(#1)}}
\newcommand{\Maximal}[1]{\ensuremath{\myfnname{Maximal}(#1)}}
\newcommand{\Maxleosilo}[2]{\ensuremath{\myfnname{Max-Leo-silo}(#1, #2)}}
\newcommand{\Left}[1]{\ensuremath{\myfnname{Left}(#1)}}
\newcommand{\LHS}[1]{\ensuremath{\myfnname{LHS}(#1)}}
\newcommand{\Memo}[1]{\ensuremath{\myfnname{Memo}(#1)}}
\newcommand{\Memoized}[1]{\ensuremath{\myfnname{Memoized}(#1)}}
\newcommand{\myL}[1]{\ensuremath{\myfnname{L}(#1)}}
\newcommand{\Next}[1]{\ensuremath{\myfnname{Next}(#1)}}
\newcommand{\Origin}[1]{\ensuremath{\myfn{Origin}{#1}}}
\newcommand{\Penult}[1]{\ensuremath{\myfnname{Penult}(#1)}}
\newcommand{\Postdot}[1]{\ensuremath{\myfnname{Postdot}(#1)}}
\newcommand{\Predict}[1]{\ensuremath{\myfnname{Predict}(#1)}}
\newcommand{\Predot}[1]{\ensuremath{\myfnname{Predot}(#1)}}
\newcommand{\Prev}[1]{\ensuremath{\myfnname{Prev}(#1)}}
\newcommand{\PSL}[2]{\ensuremath{\myfnname{PSL}[#1][#2]}}
\newcommand{\RHS}[1]{\ensuremath{\myfnname{RHS}(#1)}}
\newcommand{\Right}[1]{\ensuremath{\myfnname{Right}(#1)}}
\newcommand{\Rule}[1]{\ensuremath{\myfnname{Rule}(#1)}}
\newcommand{\Silo}[1]{\ensuremath{\myfnname{Silo}(#1)}}
\newcommand{\Symbol}[1]{\ensuremath{\myfnname{Symbol}(#1)}}
\newcommand{\Valid}[1]{\ensuremath{\myfnname{Valid}(#1)}}
\newcommand{\Instantiated}[1]{\ensuremath{\myfnname{Instantiated}(#1)}}
\newcommand{\PLSY}[1]{\ensuremath{\myfnname{PLSY}(#1)}}
\newcommand{\LSY}[1]{\ensuremath{\myfnname{LSY}(#1)}}
\newcommand{\SymEq}[1]{\ensuremath{\myfnname{Sym-Eq}(#1)}}

% \Ctables is the variable "tables"; \Vtables{<alg>} follows it with
% the algorithm name <alg> (set via \alg) in square brackets.
\newcommand\Ctables{\var{tables}}
\newcommand\Vtables[1]{\Ctables[\alg{#1}]}

% table[<i>] in several forms.  \Etable and \Rtable have identical
% bodies; \bigEtable uses \big-sized brackets; \Rtablesize puts the
% table between \big-sized bars; \Vtable wraps the index in \var.
\newcommand\Etable[1]{\ensuremath{\myfnname{table}[#1]}}
\newcommand\bigEtable[1]{\ensuremath{\myfnname{table}\bigl[#1\bigr]}}
\newcommand\Rtable[1]{\ensuremath{\myfnname{table}[#1]}}
\newcommand\Rtablesize[1]{\ensuremath{\bigl| \myfnname{table}[#1] \bigr|}}
\newcommand\Vtable[1]{\Etable{\var{#1}}}
% Two-index forms: table[<i>,<j>]; \EVtable wraps only the second
% index in \var.
\newcommand\EEtable[2]{\ensuremath{\myfnname{table}[#1,#2]}}
\newcommand\EVtable[2]{\EEtable{#1}{\var{#2}}}

% I want to use 'call' outside of pseudocode
% \mycallname{<name>}: the procedure name, set with \textproc.
% \call{<name>}{<args>}: the name followed by (<args>); when <args> is
% empty the parentheses are omitted as well.
\newcommand\mycallname[1]{\textproc{#1}}
\newcommand\call[2]{\mycallname{#1}\ifthenelse{\equal{#2}{}}{}{(#2)}}%

% I don't like to put whole paragraphs in italics,
% so I make this simple variation on the "plain" theoremstyle
% (upright body, bold head ending in a period).
\newtheoremstyle{myplain}
  {10pt}   % ABOVESPACE
  {10pt}   % BELOWSPACE
  {\normalfont}  % BODYFONT
  {0pt}       % INDENT (empty value is the same as 0pt)
  {\bfseries} % HEADFONT
  {.}         % HEADPUNCT
  {5pt plus 1pt minus 1pt} % HEADSPACE
  {}          % CUSTOM-HEAD-SPEC

% Applies to every \newtheorem declared after this point.
\theoremstyle{myplain}

% "oldtheorem" is the underlying theorem environment; its counter is
% shared by the lemma, definition, observation and construction
% environments declared after it.  The per-chapter numbering variant is
% commented out.
% \newtheorem{oldtheorem}{Theorem}[chapter]
\newtheorem{oldtheorem}{Theorem}
% "theorem" is currently a plain wrapper around oldtheorem; the closing
% centered rule used by the other wrappers is commented out here.
\newenvironment{theorem}
{
  \begin{oldtheorem}
}
{
  % \begin{center}
  % \vspace{-.4\baselineskip}
  % \rule{3em}{.5pt}
  % \end{center}
  \end{oldtheorem}
}

% Lemmas share the oldtheorem counter and have no closing rule.
\newtheorem{lemma}[oldtheorem]{Lemma}

% Definitions, observations and constructions each wrap a "bare"
% theorem-like environment (numbered with the oldtheorem counter) and
% close it with a short centered rule, 3em wide and .5pt thick, pulled
% up by .4\baselineskip.
% The definition wrapper additionally asks LaTeX not to break the page
% around the upward skip (\nopagebreak[4]) and permits a break after
% the rule (\pagebreak[0]).
\newtheorem{baredefinition}[oldtheorem]{Definition}
\newenvironment{definition}{ \begin{baredefinition}
}{ \begin{center}
\nopagebreak[4]%
\vspace{-.4\baselineskip}%
\nopagebreak[4]%
\rule{3em}{.5pt}
\pagebreak[0]
\end{center} \end{baredefinition} }

\newtheorem{bareobservation}[oldtheorem]{Observation}
\newenvironment{observation}{ \begin{bareobservation}
}{ \begin{center}
\vspace{-.4\baselineskip}
\rule{3em}{.5pt}
\end{center} \end{bareobservation} }

\newtheorem{bareconstruction}[oldtheorem]{Construction}
\newenvironment{construction}{ \begin{bareconstruction}
}{ \begin{center}
\vspace{-.4\baselineskip}
\rule{3em}{.5pt}
\end{center} \end{bareconstruction} }

% \padnum{<n>}: prints <n> preceded by one "0" for each of the
% thresholds 10, 100 and 1000 that it falls below, so 5 becomes 0005,
% 42 becomes 0042 and 123 becomes 0123.  It is used in the index sort
% keys of this file, so that numbered entries sort in numeric order.
\newcommand{\padnum}[1]{%
   \ifnum #1 < 10 0\fi%
   \ifnum #1 < 100 0\fi%
   \ifnum #1 < 1000 0\fi%
   #1%
}
% My macros for definition & theorem titles and references
% The 'q' forms are 'quiet' -- they do not index
% Don't use definition titles for index -- use \xdfn instead.
% \dtitle{<title>}: prints <title> in bold followed by a colon, and
% files "Definition <number>. <title>" in the theorems index, sorted by
% the zero-padded value of the oldtheorem counter.
\newcommand\dtitle[1]{\textbf{#1}:\index{recce-theorems}{%
  \padnum{\theoldtheorem}@Definition \theoldtheorem. #1%
}}
% \newcommand\dtitle[1]{\textbf{#1}:}
% \rawdref{<term>}{<label>}: prints (D<ref>) when <term> is empty and
% (D<ref> ``<term>'') otherwise.
\newcommand{\rawdref}[2]{%
  \ifthenelse{\equal{#1}{}}%
  {(D\ref{#2})}%
  {(D\ref{#2} ``#1'')}%
}
% \dref[<term>]{<label>}: the user-level form.  In math mode the
% reference is wrapped in \text so that it is set as text.
\newcommand{\dref}[2][]{%
   \ifmmode{\text{\rawdref{#1}{#2}}}%
   \else{\rawdref{#1}{#2}}%
   \fi%
}
% \newcommand\qdtitle[1]{\textbf{#1}:}
% \ttitle{<title>}: theorem counterpart of \dtitle.  Prints <title> in
% bold followed by a colon, and files "Theorem <number>. <title>" in
% the theorems index, sorted by the zero-padded oldtheorem counter.
% The definition is closed on the same line as the \index argument so
% that no end-of-line space token ends up in the expansion.
\newcommand\ttitle[1]{\textbf{#1}:\index{recce-theorems}{%
  \padnum{\theoldtheorem}@Theorem \theoldtheorem. #1%
}}
% \tref{<label>} and \lemref{<label>}: references of the form (T<ref>)
% and (L<ref>), wrapped in \text.
\newcommand\tref[1]{\text{(T\ref{#1})}}
\newcommand\lemref[1]{\text{(L\ref{#1})}}
% \ltitle{<title>}: lemma title; prints <title> in bold followed by a
% colon and files "Lemma <number>. <title>" in the theorems index,
% sorted by the zero-padded oldtheorem counter.
\newcommand\ltitle[1]{\textbf{#1}:\index{recce-theorems}{%
  \padnum{\theoldtheorem}@Lemma \theoldtheorem. #1%
}}

% \algtitle{<caption>}{<label>}: sets the caption and label of an
% algorithm float and files "Algorithm <number>: <caption>" in the
% algorithms index, sorted by the zero-padded algorithm number.
\newcommand{\algtitle}[2]{%
  \caption{#1}
  \label{#2}
  \index{recce-algorithms}{%
  Algorithm \padnum{\thealgorithm}@Algorithm \thealgorithm: #1%
}}

% \figtitle{<caption>}{<label>}: the same for figures.
% NOTE(review): the entry is written to the recce-algorithms index, not
% to a figures index; the \makeindex{recce-figures} declaration is
% commented out in this file, so this looks deliberate -- confirm.
\newcommand{\figtitle}[2]{%
  \caption{#1}
  \label{#2}
  \index{recce-algorithms}{%
  Figure \padnum{\thefigure}@Figure \thefigure: #1%
}}

% \becuz: the \because symbol, usable in text or math mode.
\newcommand{\becuz}{\ensuremath{\because}}

% Hyphenation exceptions: the permitted break points for these words.
\hyphenation{oper-and oper-ands}
\hyphenation{look-ahead}
\hyphenation{memo-ization}
\hyphenation{al-ti-tude}

% I use parboxes in equations.  This sets a useful width for them.
% \longtagwidth is the width of the sample tag "(9999)" plus a \quad;
% \mathparwidth is \textwidth less that amount.
\newlength{\mathparwidth}
\newlength{\longtagwidth}
\settowidth{\longtagwidth}{(9999)\quad}
\setlength{\mathparwidth}{\dimexpr\textwidth-\longtagwidth}
% \myparbox[<width>]{<text>}: a top-aligned, ragged-right \parbox of
% the given width (default \mathparwidth).  After the text, the depth
% of the last line is cancelled and a fixed 1ex of space is added.
\newcommand{\myparbox}[2][\mathparwidth]{%
  \parbox[t]{#1}{%
  \raggedright#2\par
  \vspace{-\prevdepth} % remove the depth of the last line
  \vspace{1ex} % add a fixed vertical space
  }%
}

% \makeindex
\begin{document}

\title{The Marpa book}

\author{Jeffrey Kegler}
\thanks{%
Copyright \copyright\ 2015 Jeffrey Kegler.
}
\thanks{%
This document is licensed under
a Creative Commons Attribution-NoDerivs 3.0 United States License.
}

\thanks{\textbf{This is a draft.}}
\thanks{Date: \today}

% \begin{abstract}
% Marpa is
% a practical and fully implemented
% algorithm for the recognition,
% parsing and evaluation of context-free grammars.
% The Marpa recognizer is the first
% practical implementation
% of the improvements
% to Earley's algorithm found in
% Joop Leo's%
% \index{recce-general}{Leo, Joop}
% 1991 paper.
% Marpa has a new parse engine that
% allows the user to alternate
% between Earley-style syntax-driven parsing,
% and procedural parsing of the type available
% with recursive descent.
% Marpa is left-eidetic so that,
% unlike recursive descent,
% Marpa's procedural logic has available
% full information about
% the state of the parse so far.
% The Marpa recognizer described
% is a simplification of that
% in our 2013 paper~\cite{Marpa-2013}.
% \end{abstract}

\maketitle

\chapter{Status of this paper}
This paper is a draft.
Please use the date at the bottom of the
first page
to make sure this is the latest revision.
If this revision is not the latest, please ignore it.
If this does seem to be the latest version,
and you are adventurous,
then read on.
Chapters
\ref{ch:introduction},
\ref{ch:preliminaries},
\ref{ch:rewrite},
\ref{ch:dotted},
\ref{ch:earley-items},
\ref{ch:tethers}
and
\ref{ch:earley-tables}
are in the ``advanced draft'' stage.
Advanced draft chapters are still subject to revision,
but the author hopes they are stable enough
to make comments and corrections useful.
Readers should note that changes in early draft chapters
sometimes require changes
to chapters whose content was thought to
be settled.
Therefore, it is possible that
even chapters in advanced draft status
will change dramatically.

TODO: When done with this revision, update chapters

Chapters
\ref{ch:silos},
\ref{ch:leo},
\ref{ch:pseudocode},
\ref{ch:correctness},
and
\ref{ch:complexity}
are in \dfn{early draft} stage.
``Early draft'' means that the author's thoughts are not well settled,
and the chapters are likely to contain inconsistencies and errors.
Comments and corrections on early draft
chapters are not encouraged ---
the material may be already slated for deletion,
rewriting or rethinking.

\chapter{Introduction}
\label{ch:introduction}

The Marpa project was intended to create
a practical and highly available tool
to generate and use general context-free
parsers.
Tools of this kind
had long existed
for LALR~\cite{Johnson} and
regular expressions.
But, despite an encouraging academic literature,
no such tool had existed for context-free parsing.

The first stable version of Marpa was uploaded to
a public archive on Solstice Day 2011.
This monograph describes the algorithm used
in the most recent version of Marpa,
Marpa::R2~\cite{Marpa-R2}.
It is a simplification of the algorithm presented
in our earlier paper~\cite{Marpa-2013}.

\section{A proven algorithm}

While the presentation in this monograph is theoretical,
the approach is practical.
The Marpa::R2 implementation has been widely available
for some time,
and has seen considerable use,
including in production environments.
Many of the ideas in the parsing literature
satisfy theoretical criteria,
but in practice turn out to face significant obstacles.
An algorithm may be as fast as reported, but may turn
out not to allow
adequate error reporting.
Or a modification may speed up the recognizer,
but require additional processing at evaluation time,
leaving no advantage to compensate for
the additional complexity.

In this monograph, we describe the Marpa
algorithm
as it was implemented for Marpa::R2.
In many cases,
we believe there are better approaches than those we
have described.
But we treat these techniques,
however solid their theory,
as conjectures.
Whenever we mention a technique
that was not actually implemented in
Marpa::R2,
we will always explicitly state that
that technique is not in Marpa as implemented.

\section{Features}

\subsection{General context-free parsing}
As implemented,
Marpa parses
all ``proper'' context-free grammars.
The
proper context-free grammars are those which
are free of cycles,
unproductive symbols,
and
inaccessible symbols.
Worst case time bounds are never worse than
those of Earley~\cite{Earley1970},
and therefore never worse than $\order{\var{n}^3}$.

\subsection{Linear time for practical grammars}
Currently, the grammars suitable for practical
use are thought to be a subset
of the deterministic context-free grammars.
Using a technique discovered by
Leo~\cite{Leo1991},
Marpa parses all of these in linear time.
Leo's modification of Earley's algorithm is
\On{} for LR-regular grammars.
Leo's modification
also parses many ambiguous grammars in linear
time.

\subsection{Left-eidetic}
The original Earley algorithm kept full information
about the parse ---
including partial and fully
recognized rule instances ---
in its tables.
At every parse location,
before any symbols
are scanned,
Marpa's parse engine makes available
its
information about the state of the parse so far.
This information is
in useful form,
and can be accessed efficiently.

\subsection{Recoverable from read errors}
When
Marpa reads a token which it cannot accept,
the error is fully recoverable.
An application can try to read another
token.
The application can do this repeatedly
as long as none of the tokens are accepted.
Once the application provides
a token that is accepted by the parser,
parsing will continue
as if the unsuccessful read attempts had never been made.

\subsection{Ambiguous tokens}
Marpa allows ambiguous tokens.
These are often useful in natural language processing
where, for example,
the same word might be a verb or a noun.
Use of ambiguous tokens can be combined with
recovery from rejected tokens so that,
for example, an application could react to the
rejection of a token by reading two others.

\section{Using the features}

\subsection{Error reporting}
An obvious application of left-eideticism is error
reporting.
Marpa's abilities in this respect are
ground-breaking.
For example,
users typically regard an ambiguity as an error
in the grammar.
Marpa, as currently implemented,
can detect an ambiguity and report
specifically where it occurred
and what the alternatives were.

\subsection{Event driven parsing}
As implemented,
Marpa::R2~\cite{Marpa-R2}
allows the user to define ``events''.
Events can be defined that trigger when a specified rule is complete,
when a specified rule is predicted,
when a specified symbol is nulled,
when a user-specified lexeme has been scanned,
or when a user-specified lexeme is about to be scanned.
A mid-rule event can be defined by adding a nulling symbol
at the desired point in the rule,
and defining an event which triggers when the symbol is nulled.

\subsection{Ruby slippers parsing}
Left-eideticism, efficient error recovery,
and the event mechanism can be combined to allow
the application to change the input in response to
feedback from the parser.
In traditional parser practice,
error detection is an act of desperation.
In contrast,
Marpa's error detection is so painless
that it can be used as the foundation
of new parsing techniques.

For example,
if a token is rejected,
the lexer is free to create a new token
in the light of the parser's expectations.
This approach can be seen
as making the parser's
``wishes'' come true,
and we have called it
``Ruby Slippers Parsing''.

One use of the Ruby Slippers technique is to
parse with a clean
but oversimplified grammar,
programming the lexical analyzer to make up for the grammar's
shortcomings on the fly.
As part of Marpa::R2~\cite{Marpa-R2},
the author has implemented an HTML parser,
based on a grammar that assumes that all start
and end tags are present.
Such an HTML grammar is too simple even to describe perfectly
standard-conformant HTML,
but the lexical analyzer is
programmed to supply start and end tags as requested by the parser.
The result is a simple and cleanly designed parser
that parses very liberal HTML
and accepts all input files,
in the worst case
treating them as highly defective HTML.

\subsection{Ambiguity as a language design technique}
In current practice, ambiguity is avoided in language design.
This is very different from the practice in the languages humans choose
when communicating with each other.
Human languages exploit ambiguity in order to design highly flexible,
powerfully expressive languages.
For example,
the language of this monograph, English, is notoriously
ambiguous.

Ambiguity of course can present a problem.
A sentence in an ambiguous
language may have undesired meanings.
But note that this is not a reason to ban potential ambiguity ---
it is only a problem with actual ambiguity.

Syntax errors, for example, are undesired, but nobody tries
to design languages to make syntax errors impossible.
A language in which every input was well-formed and meaningful
would be cumbersome and even dangerous:
all typos in such a language would be meaningful,
and the parser would never warn the user about errors, because
there would be no such thing.

With Marpa, ambiguity can be dealt with in the same way
that syntax errors are dealt with in current practice.
The language can be designed to be ambiguous,
but any actual ambiguity can be detected
and reported at parse time.
This exploits Marpa's ability
to report exactly where
and what the ambiguity is.
Marpa::R2's own parser description language, the SLIF,
uses ambiguity in this way.

\subsection{Auto-generated languages}
\cite[pp.~6--7]{Culik1973} points out that the ability
to efficiently parse LR-regular languages
opens the way to auto-generated languages.
In particular,
\cite{Culik1973} notes that a parser which
can parse any LR-regular language will be
able to parse a language generated using syntax macros.

\subsection{Second order languages}
In the literature, the term ``second order language''
is usually used to describe languages with features
which are useful for second-order programming.
True second-order languages --- languages which
are auto-generated
from other languages ---
have not been seen as practical,
since there was no guarantee that the auto-generated
language could be efficiently parsed.

With Marpa, this barrier is removed.
As an example,
Marpa::R2's own parser description language, the SLIF,
allows ``precedenced rules''.
Precedenced rules are specified in an extended BNF.
The BNF extensions allow precedence and associativity
to be specified for each RHS.

Marpa::R2's precedenced rules are implemented as
a true second order language.
The SLIF representation of the precedenced rule
is parsed to create a BNF grammar which is equivalent,
and which has the desired precedence.
Essentially,
the SLIF does a standard textbook transformation.
The transformation starts
with a set of rules,
each of which has a precedence and
an associativity specified.
The result of the transformation is a set of
rules in pure BNF.
The SLIF's advantage is that it is powered by Marpa,
and therefore the SLIF can be certain that the grammar
that it auto-generates will
parse in linear time.

Notationally, Marpa's precedenced rules
are an improvement over
similar features
in LALR-based parser generators like
yacc or bison.
In the SLIF,
there are two important differences.
First, in the SLIF's precedenced rules,
precedence is generalized, so that it does
not depend on the operators:
there is no need to identify operators,
much less class them as binary, unary, etc.
This more powerful and flexible precedence notation
allows the definition of multiple ternary operators,
and multiple operators with arity above three.

Second, and more important, a SLIF user is guaranteed
to get exactly the language that the precedenced rule specifies.
The user of the yacc equivalent must hope their
syntax falls within the limits of LALR.

\section{How to read this document}

TODO: When done with this revision, update chapters

Chapter
\ref{ch:preliminaries} describes the notation and conventions
of this monograph.
Chapter \ref{ch:rewrite} deals with Marpa's
grammar rewrites.
The next three chapters develop the ideas for Earley's algorithm.
Chapter \ref{ch:dotted} describes dotted rules.
Chapter \ref{ch:earley-items} describes Earley items.
Chapter \ref{ch:tethers} introduces tethers,
which are chains of top-down causation.
Chapter \ref{ch:earley-tables} describes
the remaining ideas behind
basic Earley implementations,
including
Earley sets
and Earley tables.
Chapter \ref{ch:silos} introduces silos.
Like tethers, silos are chains of causation,
but unlike tethers, in silos the causation is
largely bottom-up.

Chapter \ref{ch:leo} describes Leo's modification
to Earley's algorithm.
Chapter \ref{ch:pseudocode} presents the pseudocode
for Marpa's recognizer.
Chapter
\ref{ch:correctness}
contains a proof of Marpa's correctness.
Chapter \ref{ch:complexity} sets out our
time and space complexity results.

Because of its practical applications,
we expect this monograph to be of interest to many
who do not ordinarily read documents with this
level of mathematical apparatus.
For those readers, we offer some suggestions
which will be well known to our more mathematical
readers.

In most fields, texts are intended to be,
and often are, read through to the end,
starting at page one.
A monograph of this kind is rarely
read that way.
Even the most mathematically sophisticated
reader will skip most or all
of the proofs
on a first reading.
And a mathematically inclined
reader will usually
not read a proof line-by-line
unless and until her previous readings
have convinced her that the proof
is of sufficient
interest to deserve this kind of
attention.

This is not to say that we think
that the proofs are unimportant.
The proofs explore how our ideas
and claims
are connected to each other.
There is an aesthetic satisfaction in
this deeper level of knowledge.
And the proofs
increase our
assurance that our claims are, in fact, true.

But the proofs are also of practical use,
even to the programmer who is willing to
take our word for everything in these pages.
If, when coding,
the programmer only knows ``what'' and ``how'',
he will find it hard to keep all of this material
in his mind at once.
If the programmer knows,
not just ``what'' and ``how'',
but also ``why'',
he will understand the connections among
these ideas.
When the programmer
understands ``why'',
the book is always open in front of him,
turned to whatever page it is that
he needs.

We expect
most readers of this monograph
to have a practical bent.
For those readers,
one way to start is to read the preliminary
material for as long as it seems relevant,
skipping the lemmas,
as well as the proofs for both lemmas and
theorems.
When impatience for something ``closer to
the metal'' arises,
this reader should
jump ahead
to the pseudocode in
Chapter \ref{ch:pseudocode}.

\chapter{Preliminaries}
\label{ch:preliminaries}

We assume familiarity with the theory of parsing.
Earley's algorithm is described in full,
but previous familiarity will be helpful.

\section{Notation}

This monograph will
use subscripts to indicate commonly occurring types.
\begin{center}
\begin{tabular}{ll}
$\var{X}_T$ & The variable \var{X} of type \type{T} \\
$\var{set-one}_{\set{T}}$ & The variable \var{set-one} of type set of \type{T} \\
\type{SYM} & The type for a symbol \\
\type{STR} & The type for a string \\
\type{EIM} & The type for an Earley item \\
\sym{\var{a}} & A variable \var{a} of type \type{SYM} \\
\str{\var{a}} & A variable \var{a} of type \type{STR} \\
\Veim{a} & A variable \var{a} of type \type{EIM} \\
\Vsymset{set-two} & The variable \var{set-two}, a set of symbols \\
\Veimset{set-two} & The variable \var{set-two}, a set of Earley items
\end{tabular}
\end{center}
Strings and symbols occur frequently and have a special
notation:
\begin{center}
\begin{tabular}{ll}
\Vsym{a} & \var{a}, a symbol variable \\
\Vstr{a} & \var{a}, a string variable
\end{tabular}
\end{center}%
\index{recce-notation}{<<str>>@\Vstr{str}}%
\index{recce-notation}{<sym>@\Vsym{sym}}
Subscripts may be omitted when the type
is obvious from the context.
The notation for
constants is the same as that for variables.
Multi-character variable names will be common.

Concatenation is shown
only when useful for clarity.
All other operations are always explicit.
\begin{center}
\begin{tabular}{ll}
Multiplication &  $\var{a} \times \var{b}$ \\
Concatenation & $\var{a} \Cat \var{b}$ \\
Subtraction & $\var{symbol-count} \subtract \var{terminal-count}$ \\
\end{tabular}
\end{center}

Where $\myfnname{f}$ is a function,
we use the notation $\myfnname{f}^{\displaystyle \var{n}}$
for the iterated function, so that
\begin{align*}
\myfnname{f}^0(\var{x}) \quad & \defined \quad \var{x}, \\
\myfnname{f}^1(\var{x}) \quad & \defined \quad \myfnname{f}(\var{x}), \\
\myfnname{f}^2(\var{x}) \quad & \defined \quad
  \myfnname{f}(\myfnname{f}(\var{x})), \quad \text{etc.} \\
\text{Also,} \quad \myfnname{f}^\ast \quad & \defined \quad
\myfnname{f}^{\var{n}} \quad \text{for some $\var{n} \ge 0$ and} \\
\myfnname{f}^+ \quad & \defined \quad
\myfnname{f}^{\var{n}} \quad \text{for some $\var{n} \ge 1$}.
\end{align*}

The statements of this monograph often require us to introduce
many new variables at once,
so that we might say,
``for some \var{a}, \var{b}, \var{c}, \ldots{} \var{z},
let \ldots{}''.
When we introduce a definition, and it
contains new variables
which cause no loss of generality,
we will prefer to simply say so,
noting any exceptions.
In cases where brevity is important,
such as in proofs,
we may abbreviate
``without loss of generality'' as \dfn{WLOG},
``assumption'' as \dfn{ASM},
``theorem'' as \dfn{Th},
and
``definition'' as \dfn{Def}.

We use the standard notation for equations,
writing
``(\textit{n})'' to refer to equation \textit{n}.%
\index{recce-notation}{(0)@(\textit{n})}
To indicate references, we write,
where \var{n} is a reference number,
(L\textit{n})%
\index{recce-notation}{(L0)@(L\textit{n})}%
\index{recce-notation}{L0@(L\textit{n})}
to say Lemma \textit{n},
(T\textit{n})%
\index{recce-notation}{(T0)@(T\textit{n})}%
\index{recce-notation}{T0@(T\textit{n})}
to say Theorem \textit{n}
and
(D\textit{n})%
\index{recce-notation}{(D0)@(D\textit{n})}%
\index{recce-notation}{D0@(D\textit{n})}
to say Definition \textit{n}.
A definition reference may define several terms:
when we wish to pinpoint one of these we write
the reference
(D\textit{n} ``\textit{x}'')%
\index{recce-notation}{(D0 "x")@(D\textit{n} ``\textit{x}'')}%
\index{recce-notation}{D0 x@(D\textit{n} ``\textit{x}'')}
to say the definition
of ``\textit{x}'' in Definition section
with reference number \textit{n}.
For example, we would write
\[
\begin{aligned}
& \text{(D42) to say Definition 42;} \\
& \text{(D7 ``\var{x}'') to say the definition of ``x'' in Definition section 7;} \\
& \text{(T11) to say Theorem 11; and} \\
& \text{(L22) to say Lemma 22.}
\end{aligned}
\]

Metonymy,
the substitution of one thing for another thing with
a related meaning,
is common in language.
For example, ``Hollywood'' is a town in California,
but the word is often used to mean the U.S. entertainment
industry.
Where our use of metonymy is non-obvious or non-intuitive,
we will make it a matter of explicit definition.

For example,
in what follows, we will define Earley items,
which contain dotted rules.
Dotted rules in turn contain rules.
When we apply a rule notion to a dotted rule,
we will mean to apply that notion to the rule of the dotted rule.
When we apply a dotted rule notion to an Earley item,
we will mean to apply that notion to the dotted rule
of the Earley item.
Metonymic application of
notions will be transitive so that,
for example,
when we apply a rule notion to an Earley item,
we will mean to apply that notion to the rule
of the dotted rule of the Earley item.

\section{Undefineds and non-well-defineds}

We will use the symbol \undefined%
\index{recce-notation}{"!@\undefined}
to mean ``undefined''
in various contexts.
For partial functions,
we will use the term ``domain'' as in category theory,
so that a partial function is not necessarily defined
for every element of its domain.
For example, we will write
\[
\Vop{f}{x} = \undefined
\]
to say that the partial function \myfnname{f} is
undefined for the domain element \var{x}.

\begin{definition}
\dtitle{Comparison involving undefineds}
\label{comparison-involving-undefineds}
If a value is undefined,
a second value is considered to be equal to it if and only if
that second value is also undefined:
\[
   \var{x} \, = \, \undefined \;\; \implies \;\; (\var{x} \, = \, \var{y} \; \equiv \; \var{y} \, = \, \undefined).
\]
\end{definition}

Traditionally, an expression is not well-defined if any element of
the expression is not well-defined.
We will find it convenient to define the result of
logical conjunction ($\land$),
logical disjunction ($\lor$),
and implication ($\Longrightarrow$)
% [ \Longrightarrow, not \implies, to avoid math spacing ]
for some cases where their second argument is not
well-defined.
Where its second argument is not well-defined,
\begin{itemize}
\item
an implication is well-defined and true,
if its first argument is false;
\item
a logical conjunction is well-defined and false,
if its first argument is false; and
\item
a logical disjunction is well-defined and true,
if its first argument is true.
\end{itemize}
Note that, under this convention,
logical conjunction and logical disjunction are asymmetric.

For example, in most cases the value of a function
will not be well-defined if its argument is undefined.
In the following, let
$\var{x} = \undefined$,
and assume that \Vop{F}{\undefined} is not well-defined.
Then
\begin{align}
\label{eq:not-well-def-example-1}
& (\var{x} = \undefined) \lor \; \Vop{F}{x}
&& \text{is well-defined and true;}
\\
\label{eq:not-well-def-example-2}
& (\var{x} \neq \undefined) \land \; \Vop{F}{x}
&& \text{is well-defined and false; and}
\\
\label{eq:not-well-def-example-3}
& (\var{x} \neq \undefined) \implies \Vop{F}{x}
&& \text{is well-defined and true.}
\end{align}
Note that
the first arguments in 
\eqref{eq:not-well-def-example-1},
\eqref{eq:not-well-def-example-2}
and
\eqref{eq:not-well-def-example-3}
are well-defined, because
of \dref[comparison of undefineds]{comparison-involving-undefineds}.

These conventions eliminate the need for a lot of
special cases.
We believe the reader will find these conventions
natural and convenient in practice.
These conventions about undefinedness apply even when
we write the logical operations out verbally
(``if \var{X} and \var{Y}, then \var{X} or \var{Y}'')
instead of symbolically
($\var{X} \; \land \; \var{Y} \implies \var{X} \; \lor \; \var{Y}$).

\section{Algorithms}

When referring to the value of a variable in an algorithm, we
will usually need, not just the variable's name, but its line
location and perhaps other information, such as an ordinal
describing the pass through a loop.
We will write \vat{\var{v}}{\var{n}}%
\index{recce-notation}{V(2)@\vat{\var{var}}{\var{line}}}
for the value
of \var{v} just after the execution of line \var{n}.
Where more than the line number
is needed to specify the value of \var{v},
we will use additional arguments,
as described for each algorithm.
For example,
for some algorithm,
\vatp{\var{v}}{\var{n}}{\var{p}}%
\index{recce-notation}{V(2+)@\vatp{\var{var}}{\var{line}}{\ldots}}
might specify the value
of \var{v} just after the execution of line \var{n}
on the \var{p}'th pass through a loop.

\section{Sequences}

Unless otherwise specified, the indexes
of a sequence are consecutive integers,
starting with zero.
Where \var{s1} and \var{s2} are sequences,
we write
\Vlastix{s1}%
\index{recce-notation}{#@$\#$!\Vlastix{seq}}
for the last index of \var{s1};
and
$\var{s1} + \var{s2}$,%
\index{recce-notation}{+@$+$!\var{seq1}+\var{seq2}}
for the concatenation of the sequence \var{s2} after the sequence
\var{s1}.
We will write
\Vel{s1}{\var{a} \ldots \var{z}}
for the subsequence
\[
    \Vel{s1}{a}, \;\;
    \el{s1}{\Vincr{a}}, \;\;
    \ldots \;\;
    \Vel{s1}{z}.
\]

The following theorem will prove useful.

\begin{theorem}
\ttitle{Sequence overlap}
\label{t:sequence-overlap}

TODO: This theorem not reviewed.  Is it needed?
Can I delete it?

Let \var{mast} be a master sequence containing two subsequences,
\var{con} and \var{con2},
such that \var{con} does not contain the top or bottom
of \var{con2}:
\begin{gather*}
\var{con} \subseteq \var{mast}
\; \land \; \var{con2} \subseteq \var{mast} \\
\el{con2}{0} \notin \var{con}
\; \land \; \el{con2}{\Vlastix{con2}} \notin \var{con}.
\end{gather*}
Let \var{a} and \var{b} be elements,
such that
\[
\var{a} \in \var{con}
\; \land \; \var{b} \in \var{con}.
\]
Then
\[
\var{a} \in \var{con2} \equiv \var{b} \in \var{con2}.
\]
\end{theorem}

\begin{proof}
Assume,
for a reductio,
that exactly one of \var{a} and \var{b}
is an element of \var{con2}.
Without loss of generality, we formalize
the assumption for the reductio as
\begin{equation}
\label{t:sequence-overlap-18}
  \var{a} \in \var{con2} \; \land \; \var{b} \notin \var{con2}.
\end{equation}
Since \var{con} and \var{con2} are,
by assumption for the theorem, subsequences of \var{mast},
let
\begin{align}
\label{t:sequence-overlap-20}
\var{a} & = \Vel{mast}{aix} \\
\label{t:sequence-overlap-22}
\var{b} & = \Vel{mast}{bix} \\
\label{t:sequence-overlap-24}
\Vel{con}{0} & = \Vel{mast}{loc} \\
\label{t:sequence-overlap-26}
\Vel{con}{\Vlastix{con}} & = \Vel{mast}{hic} \\
\label{t:sequence-overlap-28}
\Vel{con2}{0} & = \Vel{mast}{loc2} \\
\label{t:sequence-overlap-30}
\Vel{con2}{\Vlastix{con2}} & = \Vel{mast}{hic2}
\end{align}

We will find it useful to express facts about containment
as relations among indexes of \var{mast}:
\begin{align}
\label{t:sequence-overlap-32}
& \var{a} \in \var{con} && \text{ASM Th} \\
\label{t:sequence-overlap-34}
& \var{loc} \le \var{aix} \le \var{hic} &&
\eqref{t:sequence-overlap-24},
\eqref{t:sequence-overlap-26},
\eqref{t:sequence-overlap-32}
\\
\label{t:sequence-overlap-36}
& \var{b} \in \var{con} && \text{ASM Th} \\
\label{t:sequence-overlap-38}
& \var{loc} \le \var{bix} \le \var{hic} &&
\eqref{t:sequence-overlap-24},
\eqref{t:sequence-overlap-26},
\eqref{t:sequence-overlap-36}
\end{align}

Assume for an inner reductio that
\begin{equation}
\label{t:sequence-overlap-50}
\var{aix} \le \var{bix}.
\end{equation}
From \eqref{t:sequence-overlap-18},
\eqref{t:sequence-overlap-28},
\eqref{t:sequence-overlap-30}
and \eqref{t:sequence-overlap-50},
we have
\begin{equation}
\label{t:sequence-overlap-54}
\begin{gathered}
\var{loc2} \le \var{aix} \le \var{hic2} < \var{bix} \\
\therefore \; \var{aix} \le \var{hic2} < \var{bix}.
\end{gathered}
\end{equation}
Combining
\eqref{t:sequence-overlap-34},
\eqref{t:sequence-overlap-38}
and
\eqref{t:sequence-overlap-54},
we have
\begin{align}
\label{t:sequence-overlap-57}
& \var{loc} \le \var{aix} \le \var{hic2} < \var{bix} \le \var{hic} &&
\\
\label{t:sequence-overlap-59}
\therefore \; & \var{loc} \le \var{hic2} < \var{hic} &&
\\
\label{t:sequence-overlap-61}
\therefore \; & \el{con2}{\Vlastix{con2}} \in \var{con} &&
\eqref{t:sequence-overlap-24},
\eqref{t:sequence-overlap-26},
\eqref{t:sequence-overlap-30}
\end{align}
where
\eqref{t:sequence-overlap-61} is contrary
to the assumption for the theorem.
This shows the inner reductio,
from which we conclude that
\eqref{t:sequence-overlap-50} is false,
and therefore that
\begin{equation}
\label{t:sequence-overlap-70}
\var{aix} > \var{bix}.
\end{equation}

Again using \eqref{t:sequence-overlap-18},
\eqref{t:sequence-overlap-28},
and \eqref{t:sequence-overlap-30},
but this time with \eqref{t:sequence-overlap-70},
we have
\begin{align}
\label{t:sequence-overlap-73}
& \var{bix} < \var{loc2} \le \var{aix} \le \var{hic2} \\
\label{t:sequence-overlap-75}
\therefore \; & \var{bix} < \var{loc2} \le \var{aix} \\
\label{t:sequence-overlap-77}
\therefore \; & \var{loc} \le \var{bix} < \var{loc2} \le \var{aix} \le \var{hic} &&
\eqref{t:sequence-overlap-34},
\eqref{t:sequence-overlap-38}
\\
\label{t:sequence-overlap-79}
\therefore \; & \var{loc} < \var{loc2} \le \var{hic} &&
\\
\label{t:sequence-overlap-81}
\therefore \; & \el{con2}{0} \in \var{con} &&
\eqref{t:sequence-overlap-24},
\eqref{t:sequence-overlap-26},
\eqref{t:sequence-overlap-28}
\end{align}
\eqref{t:sequence-overlap-81} is contrary to assumption for the theorem,
which shows the outer reductio and the theorem.
\end{proof}

\section{Grammars}

Where \Vsymset{syms} is a non-empty set of symbols,
let $\var{syms}^\ast$ be the set of all strings
(type \dtype{STR}) formed
from those symbols.
Let $\var{syms}^+$ be
\begin{equation*}
\bigl\{ \Vstr{x}
\bigm| \Vstr{x} \in \var{syms}^\ast \;\; \land \;\; \Vstr{x} \neq \epsilon
\bigr\}.
\end{equation*}

A grammar
is a 4-tuple:
\begin{equation*}
    (\Vsymset{nt}, \Vsymset{term}, \var{rules}, \Vsym{accept}).
\end{equation*}
\Vsymset{nt} is a set of symbols called non-terminals,
and \Vsymset{term} is a set of symbols called terminals.
Here $\Vsym{accept} \in \var{nt}$.
The vocabulary of the grammar is the union of
the sets of terminals and non-terminals:
\[ \Vsymset{vocab} = \Vsymset{nt} \cup \Vsymset{term}. \]
If a string of symbols contains only terminal symbols,
that string is called a \dfn{sentence}.
When a string contains only terminals, we also write its length
in symbols as
\Vsize{input}.%
\index{recce-notation}{\Pipe{}str\Pipe{}@\Vsize{str} (size of a string of terminals)}
The length of a string which contains non-terminals will be defined later,
when we discuss inputs.

\Vruleset{rules} is a set of rules (type \dtype{RULE}),
where a rule is a duple
of the form $[\Vsym{lhs} \de \Vstr{rhs}]$,
such that
\begin{equation*}
\Vsym{lhs} \in \var{nt} \quad \text{and}
\quad \Vstr{rhs} \in \var{vocab}^\ast.
\end{equation*}
\Vsym{lhs} is referred to as the left hand side (LHS)
of \Vrule{r}.
\Vstr{rhs} is referred to as the right hand side (RHS)
of \Vrule{r}.
The LHS and RHS of \Vrule{r} may also be
referred to as
$\LHS{\Vrule{r}}$%
\index{recce-notation}{LHS(r)@\Vop{LHS}{rule}}
and
$\RHS{\Vrule{r}}$,%
\index{recce-notation}{RHS(r)@\Vop{RHS}{rule}}
respectively.

We will sometimes treat 
\RHS{\Vrule{r}} as a sequence,
so that we can write
\Vel{\RHS{\Vrule{r}}}{i}%
\index{recce-notation}{RHS[r](ix)@\Vel{\RHS{\Vrule{r}}}{ix}}
to refer to the \var{i}'th RHS symbol instance
of \Vrule{r}.
For example,
\el{\RHS{\Vrule{r}}}{0} is the first
symbol instance on the RHS of \Vrule{r};
and
\el{\RHS{\Vrule{r}}}{2} is the third
symbol instance on the RHS of \Vrule{r}.

Where \Vrule{r} is a rule,
\Vsize{\Vrule{r}}%
\index{recce-notation}{\Pipe{}rule\Pipe{}@\Vsize{rule}!size of a RULE}
is the length of its RHS, in symbols;
and
\Vlastix{\Vrule{r}}%
\index{recce-notation}{#rule@\Vlastix{rule}!last index of the RHS of a RULE}
is equal to \Vlastix{\RHS{\Vrule{r}}}.
Therefore, the last symbol instance of the RHS of \Vrule{r}
may be referred to as any of
\begin{gather*}
\el{\RHS{\Vrule{r}}}{\Vlastix{\RHS{\Vrule{r}}}}, \\
\el{\RHS{\Vrule{r}}}{\Vlastix{\Vrule{r}}} \quad \text{or} \\
\el{\RHS{\Vrule{r}}}{(\Vdecr{\Vsize{\RHS{\Vrule{r}}}})}.
\end{gather*}

An alternative way of referring to the \var{i}'th RHS symbol instance
of \Vrule{r} is
\op{RHS}{\Vrule{r}, \var{i}}.%
\index{recce-notation}{RHS(r, ix)@\op{RHS}{\Vrule{r}, \var{ix}}}
We will write
\el{\RHS{\Vrule{r}}}{\var{a} \ldots \var{z}}
for the subsequence of RHS symbol instances
\[
    \el{\RHS{\Vrule{r}}}{\var{a}}, \;\;
    \el{\RHS{\Vrule{r}}}{\Vincr{a}}, \;\;
    \ldots \;\;
    \el{\RHS{\Vrule{r}}}{\var{z}}.
\]

The rules imply the traditional rewriting system.
We write
\begin{align*}
& \myparbox{%
$\Vstr{x} \derives \Vstr{y}$
to say that
\Vstr{x} derives \Vstr{y} in exactly one step.
}
\intertext{%
If a superscript is placed over the arrow,
it indicates
the number of derivation steps.
So we also write
}
& \myparbox{%
$\Vstr{x} \xderives{1} \Vstr{y}$
to say that
\Vstr{x} derives \Vstr{y} in one step;
} \\
& \myparbox{%
$\Vstr{x} \xderives{\var{n}} \Vstr{y}$
to say that
\Vstr{x} derives \Vstr{y} in \var{n} steps;
} \\
& \myparbox{%
$\Vstr{x} \xderives{0} \Vstr{y}$
to say that
\Vstr{x} derives \Vstr{y} in zero steps;
} \\
& \myparbox{%
$\Vstr{x} \destar \Vstr{y}$
to say that
\Vstr{x} derives \Vstr{y} in zero or more steps;
and
} \\
& \myparbox{%
$\Vstr{x} \deplus \Vstr{y}$
to say that
\Vstr{x} derives \Vstr{y} in one or more steps.
}
\end{align*}

A derivation in zero steps
is called a
\xdfn{trivial derivation}{trivial (derivation)}.
A symbol \Vsym{x} is
\xdfn{nullable}{nullable!in traditional parsing theory} if and only if
$\Vsym{x} \destar \epsilon$.
We say that symbol \Vsym{x} is
\xdfn{nulling}{nulling!in traditional parsing theory}
if and only if
\[
  \text{for all \Vstr{y}, if $\Vsym{x} \destar \Vstr{y}$,
  then $\Vstr{y} \destar \epsilon$.
  }
\]
A symbol is a
\xdfn{proper nullable}{proper nullable!in traditional parsing theory}
if it is nullable, but not nulling.
Note that,
following \cite[Vol. 1, p. 86]{AU1972},
\[
\text{%
  if $\Vstr{x} \destar \Vstr{y}$ then,
  for some \var{n}, $\var{n} \ge 0$,
  we have
  $\Vstr{x} \xderives{\var{n}} \Vstr{y}$
}
\]
and
\[
\text{%
if $\Vstr{x} \deplus \Vstr{y}$,
then for some \var{n},
$\var{n} \ge 1$, we have
$\Vstr{x} \xderives{\var{n}} \Vstr{y}$.
}
\]

\begin{definition}
\dtitle{Nulling strings}
We say that a string, call it \Vstr{x}, is
\xdfn{nullable}{nullable!STR}
if and only if
\[
\Vstr{x} \destar \epsilon.
\]
We say that a string, call it \Vstr{x}, is
\xdfn{nulling}{nulling!STR}
if and only if
\[
\text{%
  for all \Vstr{y}, if $\Vstr{x} \destar \Vstr{y}$,
  then $\Vstr{y} \destar \epsilon$.
}
\]
These definitions can be satisfied vacuously.
If \Vstr{x} is the empty string of symbols,
then \Vstr{x} is nullable.
And, if \Vstr{x} is the empty string of symbols,
then \Vstr{x} is nulling.
\end{definition}

The literature does not always distinguish between two
meanings of the term ``derivation step''.
It can sometimes mean a single string in a derivation,
and at other times means the action of one string
deriving another.
In this monograph, we will say ``step'' to mean a single
string in a derivation,
and we will call the transition from one string to another,
a \dfn{derivation move} or, when it is clear in context,
a \dfn{move}.
For example, in
\begin{equation}
\label{eq:def-move-1}
   \Vstr{x} \derives \Vstr{y},
\end{equation}
by ``step'' we mean
\Vstr{x} and \Vstr{y} considered separately,
so that there are two steps in
\eqref{eq:def-move-1}.
By ``move''
we mean \eqref{eq:def-move-1} considered as a whole,
so that
\eqref{eq:def-move-1} is a single ``move'',
with \Vstr{x} as its left side,
and
\Vstr{y} as its right side.

We say that \Vstr{desc} is a direct descendant of \Vsym{A} if
it is \Vstr{A-rhs} where $\Vsym{A} \de \Vstr{A-rhs}$ is a rule,
or if it is the empty string where \Vsym{A} is a nulling terminal.
We say that a derivation is \dfn{leftmost} if at each of its steps,
its leftmost nonterminal is replaced by one of its direct descendants.
We say that a derivation is \dfn{rightmost} if at each of its steps,
its rightmost nonterminal is replaced by one of its direct descendants.

When we want to make clear which step a symbol instance is from,
we will write $\var{si}@\var{x}$ to indicate
the symbol instance \Vinst{si} at Step \var{x}.
We will sometimes write the symbol instance using only
the symbol, in which case
$\var{A}@\var{x}$ will indicate
an instance of symbol \Vsym{A} at Step \var{x}.
For example, let
\begin{equation}
\label{eq:symbol-step-instance-notation}
    \Vsym{A} \derives \Vsym{A}
\end{equation}
be a derivation,
where the left hand side of the derivation
in \eqref{eq:symbol-step-instance-notation}
is Step 1 of the derivation,
so that
the right hand side of the derivation
in \eqref{eq:symbol-step-instance-notation}
must be Step 2 of the derivation.
Then
$\var{A}@1$ indicates the instance of \Vsym{A} in Step 1,
and
$\var{A}@2$ indicates the instance of \Vsym{A} in Step 2,
so that
\begin{equation*}
\var{A}@1 \derives \var{A}@2
\end{equation*}
is equivalent to
\eqref{eq:symbol-step-instance-notation}.

Consider the derivation
\begin{equation}
\Vsym{A} \derives \Vstr{rhs} \destar \Vstr{left} \cat \Vsym{A} \cat \Vstr{right}.
\end{equation}
We say that the rule $\Vsym{A} \de \Vstr{rhs}$
and the symbol \Vsym{A} are
\begin{center}
\begin{tabular}{ll}
\dfn{middle-recursive} & if
  \text{$\Vstr{left} \ndestar \epsilon$ and $\Vstr{right} \ndestar \epsilon$} \\
\dfn{left-recursive} &  if $\Vstr{left} \destar \epsilon$ \\
\dfn{right-recursive} &  if $\Vstr{right} \destar \epsilon$ \\
\dfn{cyclic} & if
  \text{$\Vstr{left} \destar \epsilon$ and $\Vstr{right} \destar \epsilon$}.
\end{tabular}
\end{center}

Except where otherwise stated,
our discussions in this monograph will
assume, without loss of generality,
a grammar of interest in that context,
\var{g}, such that
\begin{gather*}
    \var{g} = (\Vsymset{nt}, \Vsymset{term}, \var{rules}, \Vsym{accept}), \quad \text{where}
    \\
  \Vsymset{vocab} = \Vsymset{nt} \cup \Vsymset{term}.
\end{gather*}
The language of \var{g} is
\begin{equation}
\label{eq:def-L-g-10}
\myL{\Cg} \defined \left\lbrace
\Vstr{z} \mid \Vstr{z} \in \var{term}^\ast \land \Vsym{accept} \destar \Vstr{z}
\right\rbrace
\end{equation}
\Earley{} will refer to Earley's original
recognizer~\cite{Earley1970}.
\Leo{} will refer to Leo's revision of \Earley{}
as described in~\cite{Leo1991}.
\Marpa{} will refer to the parser described in
this monograph.
Where $\alg{Recce}$ is a recognizer,
$\myL{\alg{Recce},\Cg}$ will be the language accepted by $\alg{Recce}$
when parsing \Cg{}.

TODO: Reviewed to HERE

\section{Marpa internal grammars}
Following Aycock and Horspool~\cite{AH2002},
Marpa grammars use a rewrite to eliminate proper nullables
and nulling rules.
\begin{definition}
\dtitle{Marpa external and internal grammars}
\label{def:marpa-grammar}
The pre-rewrite grammar is called a
\dfn{Marpa external grammar},
or, more briefly,
an
\dfn{external grammar}.
The post-rewrite grammar is a
\dfn{Marpa internal grammar}%
\index{recce-definitions}{grammar, Marpa internal|mysee{Marpa internal grammar}}%
\index{recce-definitions}{grammar, internal|mysee{Marpa internal grammar}}
or, more briefly,
an
\xdfn{internal grammar}{internal grammar|mysee{Marpa internal grammar}}.

Because of the rewrite,
a Marpa internal grammar
\begin{itemize}
\item
has no nulling rules, and
\item
has no proper nullable symbols.
\end{itemize}
In the rest of this monograph,
when we refer to either a
\xdfn{grammar}{grammar|myixentry{defaulting to Marpa internal grammar}}
or a
\xdfn{Marpa grammar}{Marpa grammar|myixentry{defaulting to Marpa internal grammar}}%
\index{recce-definitions}{grammar, Marpa|myixentry{defaulting to Marpa internal grammar}}
we will mean a Marpa internal grammar,
unless otherwise stated.
\end{definition}

The external, pre-rewrite grammars
are the only ones visible to
the users of Marpa::R2.
The internal, post-rewrite grammars
are the ones actually used by the parse engine,
and therefore are
the ones described in this monograph.
Details of this rewrite are given
in Chapter \ref{ch:rewrite}.

\begin{definition}
\dtitle{Telluric symbols and strings}
\label{def:telluric}
We say that
a symbol of a Marpa internal grammar is
\xdfn{telluric}{telluric!SYM}
if and only if it is non-nulling.
We say that a string is
\xdfn{telluric}{telluric!STR}
if and only if
the string contains a telluric symbol.
\end{definition}

We use
the term ``telluric'' only for Marpa internal grammars.
In Marpa internal grammars, we know that there
are no proper nullable symbols,
so that we 
can rely on
``telluric'' to be a strict antonym of ``nullable''.
This is \textbf{not} the case for Marpa external grammars ---
non-nulling symbols of Marpa external grammars may be proper
nullables, so that ``non-nulling'' is not always
an antonym of ``nullable''.
We will make frequent use
of the fact that Marpa internal telluric symbols
are never nullable.
Calling such symbols ``telluric'' makes
it clear they have this property,
and will save us much confusion.
The term ``telluric'' originally means, roughly, ``of the earth''.
Later we will use it in contrast to the term
``ethereal''.

In the statement of the following theorems,
as in the rest of this monograph,
we will assume that we are speaking of Marpa internal grammars,
unless stated otherwise.

\begin{theorem}
\ttitle{Nullable symbol if and only if nulling}
\label{t:nullable-iff-nulling}
A symbol is nullable if and only if it is nulling.
\end{theorem}
\begin{proof}
For the purposes of this proof we read
\op{Nulling}{\Vsym{x}} as ``symbol \var{x} is nulling'',
and we read
\op{Nullable}{\Vsym{x}} as ``symbol \var{x} is nullable''.
Recall that, by default, we are speaking of Marpa internal
grammars.
No symbol in a Marpa internal grammar is a proper nullable,
that is,
\begin{align}
\label{eq:nullable-iff-nulling-10}
& \myparbox{%
there is no
\Vsym{s} such that
$\op{Nullable}{\Vsym{s}} \land \neg \op{Nulling}{\Vsym{s}}$
\becuz{}
\dref[Marpa internal grammar]{def:marpa-grammar},
} \\
\label{eq:nullable-iff-nulling-12}
& \myparbox{%
For all \Vsym{s},
$\neg \op{Nullable}{\Vsym{s}} \lor \op{Nulling}{\Vsym{s}}$
\becuz{}
\eqref{eq:nullable-iff-nulling-10}.
} \\
\label{eq:nullable-iff-nulling-14}
& \myparbox{%
For all \Vsym{s},
$\op{Nullable}{\Vsym{s}} \implies \op{Nulling}{\Vsym{s}}$
\becuz{}
\eqref{eq:nullable-iff-nulling-12}.
} \\
\label{eq:nullable-iff-nulling-16}
& \myparbox{%
For all \Vsym{s},
$\op{Nulling}{\Vsym{s}} \implies \op{Nullable}{\Vsym{s}}$
\becuz{}
Def of nulling and nullable for symbols.
} \\
\label{eq:nullable-iff-nulling-18}
& \myparbox{%
For all \Vsym{s},
$\op{Nulling}{\Vsym{s}} \iff \op{Nullable}{\Vsym{s}}$
\becuz{}
\eqref{eq:nullable-iff-nulling-14},
\eqref{eq:nullable-iff-nulling-16},
which shows the theorem.
\qedhere
}
\end{align}
\end{proof}

\begin{theorem}
\ttitle{Telluric is not nullable}
\label{t:telluric-iff-non-nullable}
A symbol is telluric,
if and only if
it is both non-nulling and non-nullable.
\end{theorem}
\begin{proof}
For the purposes of this proof,
we write \op{Telluric}{\Vsym{x}}
to say that ``symbol \var{x} is telluric'';
\op{Nulling}{\Vsym{x}}
to say that ``symbol \var{x} is nulling'';
and \op{Nullable}{\Vsym{x}}
to say that ``symbol \var{x} is nullable''.
\begin{align}
\label{eq:telluric-non-nullable-10}
& \myparbox{%
For all \Vsym{s},
$\op{Telluric}{\Vsym{s}}
\iff
\neg \op{Nulling}{\Vsym{s}}$
\becuz{}
\dref[telluric]{def:telluric}.
} \\
\label{eq:telluric-non-nullable-12}
& \myparbox{%
For all \Vsym{s},
$\op{Nullable}{\Vsym{s}}
\iff
\op{Nulling}{\Vsym{s}}$
\becuz{}
\eqref{eq:telluric-non-nullable-10},
\tref{t:nullable-iff-nulling}.
}
\end{align}
Equations
\eqref{eq:telluric-non-nullable-10}
and
\eqref{eq:telluric-non-nullable-12}
show the theorem.
\end{proof}

\begin{theorem}
\ttitle{Telluric string if and only if non-nullable}
\label{t:telluric-string-iff-nullable}
A string is telluric if and only if
it is both non-nullable and non-nulling.
\end{theorem}
\begin{proof}
Assume that \Vstr{tell}
is a telluric string.
Then
\begin{equation}
\label{eq:telluric-string-iff-nullable-5}
\myparbox{%
\Vstr{tell} contains a telluric symbol,
call it \Vsym{tell}
\becuz{}
\dref[telluric string]{def:telluric}.
}
\end{equation}
Assume, for a reductio,
that \Vstr{tell} is nullable,
so that, without loss of generality,
\begin{subequations}
\renewcommand{\theequation}{RAD-\arabic{equation}}
\setlength{\mathparwidth}{\dimexpr\mathparwidth-2em}
\begin{align}
\label{eq:telluric-string-iff-nullable-10}
\myparbox{%
$\Vstr{tell} = \Vstr{pre} \Vsym{tell} \Vstr{post}
\destar \epsilon$.
} \\
\label{eq:telluric-string-iff-nullable-12}
\myparbox{%
$\Vsym{tell} \destar \epsilon$
\becuz{}
\eqref{eq:telluric-string-iff-nullable-10}.
} \\
\label{eq:telluric-string-iff-nullable-14}
\myparbox{%
\Vsym{tell} is nullable
\becuz{}
\eqref{eq:telluric-string-iff-nullable-12}.
} \\
\label{eq:telluric-string-iff-nullable-16}
\myparbox{%
\Vsym{tell} is not nullable
\becuz{}
\eqref{eq:telluric-string-iff-nullable-5},
\tref{t:telluric-iff-non-nullable}.
}
\end{align}
\end{subequations}

Equations
\eqref{eq:telluric-string-iff-nullable-14}
and \eqref{eq:telluric-string-iff-nullable-16}
show the reductio.
From the reductio,
we conclude that
\begin{align}
\label{eq:telluric-string-iff-nullable-18}
& \myparbox{%
\Vstr{tell} is not nullable.
}
\end{align}

TODO: finish
\end{proof}

\begin{theorem}
All LHS symbols are telluric.
\end{theorem}
\begin{proof} TODO \end{proof}

\begin{theorem}
All nullable symbols are terminals.
\end{theorem}
\begin{proof} TODO \end{proof}

\begin{theorem}
A string is derived from a telluric string
if and only if
it contains at least one telluric symbol.
\end{theorem}
\begin{proof} TODO \end{proof}

\begin{theorem}
A string is derived from a telluric string
if and only if it is telluric.
\end{theorem}
\begin{proof} TODO \end{proof}

\begin{theorem}
A sentence is derived from a telluric string
if and only if
it has an input length of at least one.
\end{theorem}
\begin{proof} TODO \end{proof}

Since there are no nulling rules in Marpa's internal grammars,
a symbol is never nulled as the result of a derivation step.
Therefore, where \Vsym{nulling} is a nulling symbol,
\begin{align*}
    \Vsym{nulling} & \nderives{1} \epsilon \quad \text{and} \\
    \Vsym{nulling} & \ndeplus \epsilon.
\end{align*}
Strictly speaking, it is not wrong to say that
\begin{align*}
    \Vsym{nulling} & \xderives{0} \epsilon \quad \text{or} \\
    \Vsym{nulling} & \destar \epsilon
\end{align*}
although it is misleading,
and we avoid it in favor of
\[
    \Vsym{nulling} = \epsilon,
\]
which more clearly conveys what it means for a
Marpa internal symbol to be ``nulling''.

\begin{definition}
\dtitle{Accept rule and symbol}
\label{def:accept-rule-and-symbol}
A Marpa internal grammar always has
a dedicated acceptance rule, \Vrule{accept},
and a dedicated acceptance symbol,
\[
  \Vsym{accept} = \LHS{\Vrule{accept}},
\]
such that
for all \Vrule{x},
\[
\Vsym{accept} \notin \RHS{\Vrule{x}}
\]
and
\[
\Vsym{accept} = \LHS{\Vrule{x}} \implies \Vrule{accept} = \Vrule{x}.
\]
\end{definition}

We assume that a Marpa grammar is cycle-free ---
that none of its rules are cyclic.
We assume that every symbol is productive ---
that is, that it derives a sentence.
We assume that every symbol is accessible ---
that is, that it is derivable from the start symbol.

\section{Input}

Let the actual input to
the parse be \Cw{} such that $\Cw \in \myL{\Cg}$.
Locations in the input will be of type \dtype{LOC}.
Let \Vsize{w}%
\index{recce-notation}{\Pipe{}input\Pipe{}@\Vsize{input} (size of an input)}
be the length of the input, counted in symbols.
When we state our complexity results later,
they will often be in terms of $\var{n}$,
where $\var{n} = \Vsize{w}$.
Let \CVw{i} be the character
at position \var{i}
of the input.
String position is zero-based,
so that
$0 \le \Vloc{i} < \Vsize{w}$.
Let $\var{w}[\var{a}, \var{b}]$
be the contiguous substring
from position \var{a} to
position \var{b}, inclusive,
so that
\[ \bigsize{\var{w}[\var{a}, \var{b}]} = (\var{b} \subtract \var{a}) + 1. \]

Our definition
of \Cw{} does not allow zero-length inputs.
The Marpa parser
deals with null parses
and nulling grammars as special cases,
and this monograph will not consider them.
(Nulling grammars are those that recognize only the null string.)

Parsers typically do work while examining their input,
so that they are, in effect, working with a set of possible inputs,
of which the actual input is just one element.
Reasoning about the set of inputs possible based on what has been
seen so far plays little role in
traditional deterministic parsers,
which do limited tracking
of input already seen,
and have even less of an idea of the inputs not yet seen.
But Marpa is left-eidetic ---
it has a full, exact idea of the input already seen ---
and Earley parsers
also have a very exact idea of what the unseen portion of the input
could be.

We will call the current set of inputs, \CW{}.
\CW{} will always be such that
\begin{equation*}
\Cw \in \CW \quad \text{and} \quad \CW{} \subseteq \myL{\Cg}.
\end{equation*}
We say that \CW{} is
\xdfn{seen from}{seen from \var{i} to \var{j}!wrt an input set}
\Vloc{i} to \Vloc{j} if and only if,
for all \Vstr{w1}, \Vstr{w2}
\begin{equation*}
\Vstr{w1} \in \CW \land \Vstr{w2} \in \CW
\implies
\el{w1}{\var{i}, \, (\Vdecr{j}) \, } =
\el{w2}{\var{i}, \, (\Vdecr{j}) \, }.
\end{equation*}

Most parsing, including Earley parsing, takes place from left-to-right,
and Marpa examines its input from left to right.
We say that
\CW{} is
\xdfn{seen to}{seen to \var{j}!wrt an input set}
\var{j},
or that
\CW{} is
\xdfn{seen as far as}{seen as far as \var{j}!wrt an input set}
\var{j},
if \CW{} is seen from location 0 to \Vloc{j}.
In this monograph we will usually speak of input sets that are seen
as far as some \Vloc{j}.
If \CW{} is seen to location 0, none of its input symbols have been
seen.
If \CW{} is seen to location \Vsize{\Cw},
where \Cw{} is the actual input,
then
$\CW = \lbrace \Cw \rbrace$,
and all of its input symbols
have been seen.
In most contexts, the current set of inputs will be assumed to be \CW{}.
For example,
instead of saying that \CW{} is seen as far as \Vloc{k},
we may say that ``the input is seen as far as \Vloc{k}''.

We will say that a derivation is
\xdfn{fully seen}{fully seen!wrt a derivation},
or more simply
\xdfn{full}{full!wrt a derivation},
if its last step is \Cw{}.
Intuitively, a \dfn{symbol instance} is
a symbol in the context of a parse.
In a fully seen derivation,
the right and left locations are well-defined
for every symbol instance of every step.

More formally,
a symbol instance is a triple whose elements
are a left location, a symbol name and a right location.
We often represent symbol instances in the form
\begin{equation*}
\Vinst{inst} = \Vmkl{j} \Vsym{up} \Vmkr{k}.
\end{equation*}%
\index{recce-notation}{[]inst[]@\Vmkl{j} \Vsym{up} \Vmkr{k} (symbol instance)}
\Vmk{j} and \Vmk{k} are always optional.
We also write
\begin{itemize}
\item
\Left{\Vinst{inst}}%
\index{recce-notation}{Left(x)@\Left{\Vinst{inst}}}
for \var{j},
the left location of \Vinst{inst};
\item
\Right{\Vinst{inst}}%
\index{recce-notation}{Right(x)@\Right{\Vinst{inst}}}
for \var{k},
the right location of \Vinst{inst};
\item
\Symbol{\Vinst{inst}}%
\index{recce-notation}{Symbol(x)@\Symbol{\Vinst{inst}}}
for \Vsym{up},
the symbol name of \Vinst{inst};
\item
\Vsize{\Vinst{inst}}%
\index{recce-notation}{\Pipe{}inst\Pipe{})@\Vsize{\Vinst{inst}}}
for \xxsubtract{\var{k}}{\var{j}},
the length of \Vinst{inst} in terms of input symbols; and
\item
\Vsize{\Vsym{A}}%
\index{recce-notation}{\Pipe{}sym\Pipe{})@\Vsize{\Vsym{A}}}
for \Vsize{\Vinst{inst}},
where $\Symbol{\Vinst{inst}} = \Vsym{A}$,
and the left and right locations of \Vinst{inst}
are understood from the context.
\end{itemize}

When \Vstr{si} is a sequence of symbol instances of length \Vsize{si}
whose indexes are 0 \ldots{} \var{last},
we will write
\Symbol{\Vstr{si}}%
\index{recce-notation}{Symbol(str)@\Symbol{\Vstr{str}}}
for
\begin{equation*}
\Symbol{\el{si}{0}}, \;\;
\Symbol{\el{si}{1}}, \;\;
\ldots \;\;
\Symbol{\Vel{si}{last}}.
\end{equation*}
We will write \Vsize{\Vstr{si}}%
\index{recce-notation}{\Pipe{}str\Pipe{})@
  \Vsize{\Vstr{str}} (length of a sentential form in terms of the input)}
for
\begin{equation*}
\sum_{\var{i}=0}^{\var{last}} \Vsize{\Vel{si}{i}}.
\end{equation*}
Note that \Vsize{\Vstr{si}} is the length of the string
in terms of input symbols, and is, in general,
not a count of the
symbols in \Vstr{si}.

At some points, such as when we translate a derivation
to other notation,
we will want to justify the conversion to and from
a derivation carefully.
To do this, we will treat a derivation as a two-dimensional
ragged array.
The rows will be derivation steps,
and the columns of these variable-length rows will be symbol
instances.
We will write \drvVV{d}{s}{i} for
the \var{i}'th symbol instance of the \var{s}'th step
of the derivation \var{d}.
Steps will be numbered from 0, starting at the root.
Symbol instances will be numbered from 0, starting at the left.

Let \var{d} be a fully seen derivation,
and let $\var{wlen} = \Vsize{\Cw}$.
For every \var{d}, we will have
\begin{equation}
\drv{d}{0}{0} = \mk{0} \Vsym{accept} \Vmk{wlen}
\end{equation}
and where the length of the derivation is \var{dlen},
for all \var{a} such that $0 \le \var{a} < \var{wlen}$,
\[
  \drv{d}{\Vdecr{dlen}}{\var{a}} = \Vinst{a} = \Vmk{a} \Vsym{a} \mk{\Vincr{a}},
\]
where \Vsym{a} is $\Cw[\var{a}]$,
the symbol at location \Vloc{a} of the input.

We will use type \dtype{STR} for sequences of symbol instances
as well as symbols.
We write \Vel{s1}{i}
to refer to the \var{i}'th symbol or symbol instance
in a string,
where the first symbol or symbol instance is at
\el{s1}{0}.
We write \el{s1}{\var{i} \ldots \var{j}} to refer
to the contiguous substring of \Vstr{s1} which starts with
\Vel{s1}{i} and ends with \Vel{s1}{j}.
The range is inclusive, so that
the length of \el{s1}{\var{i} \ldots \var{j}}
is $(\xxsubtract{\var{j}}{\var{i}})+1$.
We will find it convenient to write
\drv{d}{\var{s}}{\var{a} \ldots \var{z}}
for the sequence of symbol instances
\[
    \drvVV{d}{s}{a}, \;\;
    \drv{d}{\var{s}}{\Vincr{a}}, \;\;
    \ldots \;\;
    \drvVV{d}{s}{z}
\]

\section{Focused derivations}

We now
recall our previous definition of a rightmost
derivation.
Following~\cite[Vol.~1, page~141, Lemma 2.12]{AU1972},
a rightmost derivation is defined in terms of a series of
expansions of a derivation tree, beginning at the root.
A rightmost derivation is one that always expands the rightmost
non-terminal into its direct descendants.

\begin{definition}
\dtitle{Focused derivation}
We say that the derivation \var{d}
is
\xdfn{focused}{focused (derivation)}
at \Vloc{k},
if \CW{} is seen to \Vloc{k},
and
if in every step \var{s},
\begin{itemize}
\item
if there is a non-terminal symbol instance
$\Vinst{ki} = \drvVV{d}{s}{x}$
such that $\Left{\Vinst{ki}} \le \Vloc{k} < \Right{\Vinst{ki}}$,
\var{d} expands
\drvVV{d}{s}{x}; and
\item
otherwise, \var{d} expands the rightmost non-terminal symbol
instance.
\end{itemize}
We say that \var{d} is
\xdfn{focused within}{focused within!wrt a symbol instance and a derivation}
a symbol instance \Vinst{si}
if and only if it is
focused at some \Vloc{k} such
that
\[
\Left{\var{si}} \le \Vloc{k} < \Right{\var{si}}.
\]
We say that \var{d} is
\xdfn{focused within}{focused within!wrt an EIM and a derivation}
\Veim{eim}
if and only if it is
focused at some \Vloc{k} such that
\[
\Left{\LHS{\Veim{eim}}} \le \Vloc{k} < \Right{\LHS{\Veim{eim}}}.
\]
\end{definition}

Recall from parsing theory that every derivation has an equivalent rightmost
derivation, and that the rightmost derivation is unique in its derivation
tree.
Similarly, for every \Vloc{k},
every derivation which is seen to \Vincr{k}
has an equivalent derivation that is focused at \Vloc{k},
and that \Vloc{k}-focused derivation is unique in its
derivation tree.

\begin{theorem}
\ttitle{Properties of focused derivations}
\label{t:focusing-props}
Let \var{d} be a derivation focused within
the symbol instance
\Vinst{i1}, where
\Vinst{i1} is at derivation step \var{s},
and \Symbol{\var{i1}} is
a non-terminal other than \Vsym{accept}.
Then \Vinst{i1} is a direct descendant
of a symbol instance \Vinst{i2},
such that
\begin{gather}
\label{eq:focusing-props-10}
\text{\var{i2} is at derivation step \Vdecr{s},} \\
\label{eq:focusing-props-13}
\text{\Symbol{\var{i2}} is a non-terminal,} \\
\label{eq:focusing-props-16}
\Right{\var{i2}} \ge \Right{\var{i1}}, \\
\label{eq:focusing-props-19}
\Left{\var{i2}} \le \Left{\var{i1}}, \\
\label{eq:focusing-props-22}
\text{and \var{d} is focused within \var{i2}.}
\end{gather}
In addition,
for some \Vstr{pre}, \Vstr{post},
where $\Symbol{\var{i1}} = \Vsym{i1}$ and
$\Symbol{\var{i2}} = \Vsym{i2}$,
\begin{equation}
\label{eq:focusing-props-25}
[\Vsym{i2} \de \Vstr{pre} \Vsym{i1} \Vstr{post} ] \in \Crules,
\end{equation}
and
\begin{equation}
\label{eq:focusing-props-27}
\begin{aligned}
& \Vsym{i2} && \text{Step \Vdecr{s}} \\
\derives \quad & \Vstr{pre} \Vsym{i1} \Vstr{post} \qquad && \text{Step \var{s}}
\end{aligned}
\end{equation}
\end{theorem}

\begin{proof}
Since \Vinst{i1} is not the accept symbol,
there is a derivation step \Vdecr{s}.
In each derivation step, a symbol instance is either
copied over into the next step or expanded into
its direct descendants.
Therefore,
in step \Vdecr{s}, there is either another copy of symbol
instance \Vinst{i1}, or \Vinst{i1} is the direct descendant
of another symbol instance.
Either way, call that other symbol instance, \Vinst{i2}.
\Vinst{i2} is in derivation step
\Vdecr{s} by definition, which gives us
\eqref{eq:focusing-props-10}.

We show
\eqref{eq:focusing-props-16}
and
\eqref{eq:focusing-props-19}
by cases.
In the first case, where \Vinst{i1} is a direct descendant
of \Vinst{i2}, we recall that
\begin{equation}
\label{eq:focusing-props-29}
\myparbox{
In every parse using a context-free grammar,
the right and left locations of
a direct descendant are always inside
of the single symbol from which the
direct descendant was expanded.
}
\end{equation}
The input may not have been seen to \Right{\var{i2}},
but
\eqref{eq:focusing-props-29}
is true of all factorings of all inputs,
and we may conclude that
\eqref{eq:focusing-props-16}
and
\eqref{eq:focusing-props-19}
hold for every input in \CW{}.
If \Vinst{i1} is a copy of \Vinst{i2},
\eqref{eq:focusing-props-16}
and
\eqref{eq:focusing-props-19}
follow trivially.

By assumption, \var{d} is focused within \Vinst{i1},
and therefore at some \Vloc{k} such that
\begin{equation}
\label{eq:focusing-props-30}
\Left{\var{i1}} \le \Vloc{k} < \Right{\var{i1}}.
\end{equation}
\eqref{eq:focusing-props-22}
follows from
\eqref{eq:focusing-props-16},
\eqref{eq:focusing-props-19}
and
\eqref{eq:focusing-props-30}.

We show \eqref{eq:focusing-props-13}
by cases.
In the first case,
\Vinst{i2} is a copy of \Vinst{i1}
so that
$\Symbol{\var{i2}} = \Symbol{\var{i1}}$,
and since
\Symbol{\var{i1}} is a non-terminal,
\Symbol{\var{i2}} is a non-terminal.
In the second case,
\Vinst{i2} is not a copy of \Vinst{i1},
so that \Vinst{i1} is a direct descendant of
\Vinst{i2}.
In this second case,
\Vinst{i2} is a non-terminal
by definition.
This gives us both cases,
and
\eqref{eq:focusing-props-13}.

We have already shown
\eqref{eq:focusing-props-13}
and
\eqref{eq:focusing-props-22},
so we know that,
by the definition of a focused derivation,
\Vinst{i2} is expanded into
its direct descendants in step \var{s}.
\eqref{eq:focusing-props-25}
and \eqref{eq:focusing-props-27}
follow from this observation and the definition
of a derivation.

For convenience the step numbers are shown in
\eqref{eq:focusing-props-27}.
The labeling of Step \var{s} follows from the assumption
for the theorem.
The labeling of Step \Vdecr{s} follows from
\eqref{eq:focusing-props-10}.
\end{proof}

\section{Location markers}

\subsection{Definition}

In the context of a grammar \Cg{} and an input \Cw{},
we will often use location-marked derivations.
Location-marked derivation steps are like the derivation steps
of the traditional rewriting system except that they also contain
location markers of the form \Vmk{x}, where \var{x} is a
location in \Cw{}.\footnote{
Our use of the location marker notation
was inspired by~\cite{Wich2005}.}
When not otherwise stated,
use of the location marker \Vmk{x}
implies that \CW{} has been seen to \Vmk{x}.
In its most general form,
a derivation step with a single location marker is
\begin{equation}
\label{eq:location-marker-def-2}
\Vstr{pre} \Vmkm{x} \Vstr{post}.
\end{equation}
\eqref{eq:location-marker-def-2}
means
\begin{equation*}
\begin{split}
&  \Vsym{accept} \destar \Vstr{before} \cat \Vstr{pre} \cat \Vstr{post} \cat \Vstr{after} \\
&  \land \quad \Vstr{before} \cat \Vstr{pre} \destar \var{w}[0, (\Vdecr{x})] \\
&  \land \quad \Vstr{post} \cat \Vstr{after} \destar \var{w}[\var{x}, (\Vsize{\Cw} \subtract 1)]
\end{split}
\end{equation*}

Derivations may have many location markers.
The meaning of a derivation with \var{j} different location markers,
\[ \var{m}[1], \var{m}[2] \ldots \var{m}[\var{j}], \]
is the same as the meaning of the conjunction of an ordered set of \var{j} derivations,
where the \var{i}'th member has all the markers removed except for $\var{m}[\var{i}]$.
For example,
\begin{equation}\label{eq:location-marker-def-11}
\begin{split}
&  \Vsym{accept} \destar \Vstr{before} \Vmkm{i} \Vsym{A} \cat \Vstr{after} \\
&  \qquad \derives \Vstr{before} \Vmkm{i} \Vstr{predot} \Vmkm{j} \Vstr{postdot} \cat \Vstr{after}
\end{split}
\end{equation}
is the equivalent of the logical conjunction of two derivations:
\begin{gather}
\label{eq:location-marker-def-12}
\begin{split}
&  \Vsym{accept} \destar \Vstr{before} \,[\var{i}]\, \Vsym{A} \cat \Vstr{after} \\
&  \qquad \derives \Vstr{before} \,[\var{i}]\, \Vstr{predot} \Vstr{postdot} \cat \Vstr{after}
\end{split} \\
\intertext{and}
\label{eq:location-marker-def-13}
\begin{split}
&  \Vsym{accept} \destar \Vstr{before} \cat \Vsym{A} \cat \Vstr{after} \\
&  \qquad \derives \Vstr{before} \cat \Vstr{predot} \,[\var{j}]\, \Vstr{postdot} \cat \Vstr{after}.
\end{split}
\end{gather}
In this example,
\eqref{eq:location-marker-def-12} and
\eqref{eq:location-marker-def-13}
imply that
\begin{equation}\label{eq:location-marker-def-14}
\Vstr{predot} \destar \var{w}[\var{i}, (\var{j} \subtract 1)]
\end{equation}
and therefore
\eqref{eq:location-marker-def-11}
also implies
\eqref{eq:location-marker-def-14}.
Derivations with location markers may be
composed in the same way as derivations without them,
as long as the location markers in the combined
derivation are consistent.

\subsection{Transformations}

The location marker notation is intuitive and based on the
traditional notation for derivations,
but, since it is new, we will present examples.
For the examples of this section,
we
start with the traditional derivation
\begin{gather*}
\Vstr{A} \\
\derives \Vstr{Aa} \Vsym{B} \Vsym{D} \Vstr{Az} \\
\derives \Vstr{Aa} \Vstr{Ba} \Vsym{C} \Vstr{Bz} \Vsym{D} \Vstr{Az}
\end{gather*}

\textbf{Insert new location markers}:
If a location marker is not currently used, we can insert it
to mark any location that has been seen.
In this example,
we insert
new markers
\Vmk{i}, \Vmk{j}, \Vmk{k}, \mk{\ell} and \Vmk{m}:
\begin{gather*}
\Vstr{A} \\
\derives \Vmk{i} \Vstr{Aa} \Vmk{j} \Vsym{B} \Vmk{k} \Vsym{D} \mk{\ell} \Vstr{Az} \Vmk{m} \\
\derives \Vstr{Aa} \Vstr{Ba} \Vsym{C} \Vstr{Bz} \Vsym{D} \Vstr{Az}
\end{gather*}

Introduction of a location marker \Vmk{x}, unless otherwise stated,
assumes that \CW{} has been seen to \Vmk{x},
so in this example, we assumed that the input has been seen to
the rightmost marker, \Vmk{m}.
The examples to follow deal with movement of existing
location markers, so that it will have already been assumed
that \CW{} has been seen as far as those location markers.

\textbf{Move location markers from direct descendants to their parents}:
If a location marker is before the first of its direct descendants, we can move
it to before its parent in the previous step.
In this example, \Vmk{i} is moved:
\begin{gather*}
\Vmk{i} \Vstr{A} \\
\derives \Vmk{i} \Vstr{Aa} \Vmk{j} \Vsym{B} \Vmk{k} \Vsym{D} \mk{\ell} \Vstr{Az} \Vmk{m} \\
\derives \Vstr{Aa} \Vstr{Ba} \Vsym{C} \Vstr{Bz} \Vsym{D} \Vstr{Az}
\end{gather*}
Also, if a location marker is after the last of its direct descendants,
we can move it to after its parent in the previous step.
In this example, \Vmk{m} is moved:
\begin{gather*}
\Vmk{i} \Vstr{A} \Vmk{m} \\
\derives \Vmk{i} \Vstr{Aa} \Vmk{j} \Vsym{B} \Vmk{k} \Vsym{D} \mk{\ell} \Vstr{Az} \Vmk{m} \\
\derives \Vstr{Aa} \Vstr{Ba} \Vsym{C} \Vstr{Bz} \Vsym{D} \Vstr{Az}
\end{gather*}

\textbf{Move location markers from parents to direct descendants}:
Similarly if a location marker is before a parent, we can
move it to before the first of its direct descendants in the next step;
and,
if a location marker is after a parent, we can
move it to after the last of its direct descendants in the next step.
In this example, \Vmk{j} and \Vmk{k} are moved:
\begin{gather*}
\Vmk{i} \Vstr{A} \Vmk{m} \\
\derives \Vmk{i} \Vstr{Aa} \Vmk{j} \Vsym{B} \Vmk{k} \Vsym{D} \mk{\ell} \Vstr{Az} \Vmk{m} \\
\derives \Vstr{Aa} \Vmk{j} \Vstr{Ba} \Vsym{C} \Vstr{Bz} \Vmk{k} \Vsym{D} \Vstr{Az}
\end{gather*}

\textbf{Delete location markers}:
Location markers which are no longer of interest may be removed.
In this example, \Vmk{i} and \Vmk{m} are deleted:
\begin{gather*}
\Vstr{A} \\
\derives \Vstr{Aa} \Vmk{j} \Vsym{B} \Vmk{k} \Vsym{D} \mk{\ell} \Vstr{Az} \\
\derives \Vstr{Aa} \Vmk{j} \Vstr{Ba} \Vsym{C} \Vstr{Bz} \Vmk{k} \Vsym{D} \Vstr{Az}
\end{gather*}

\textbf{Move location marker to before or after same symbol instance}:
A location marker which is before (after) a symbol instance in one derivation
step may be moved to before (after) the same symbol instance in another derivation step.
In this example, \mk{\ell} is moved:
\begin{gather*}
\Vstr{A} \\
\derives \Vstr{Aa} \Vmk{j} \Vsym{B} \Vmk{k} \Vsym{D} \mk{\ell} \Vstr{Az} \\
\derives \Vstr{Aa} \Vmk{j} \Vstr{Ba} \Vsym{C} \Vstr{Bz} \Vmk{k} \Vsym{D} \mk{\ell} \Vstr{Az}
\end{gather*}

\textbf{Simplification}:
A derivation may be simplified from the bottom up,
by removing the symbol instances outside of two markers.
In this example, the last step is simplified outside of \Vloc{j} and \Vloc{k}:
\begin{gather*}
\Vstr{A} \\
\derives \Vstr{Aa} \Vmk{j} \Vsym{B} \Vmk{k} \Vsym{D} \mk{\ell} \Vstr{Az} \\
\derives \ldots \Vmk{j} \Vstr{Ba} \Vsym{C} \Vstr{Bz} \Vmk{k} \ldots
\end{gather*}
When it is clear what is happening, the dots may be omitted:
\begin{gather*}
\Vstr{A} \\
\derives \Vstr{Aa} \Vmk{j} \Vsym{B} \Vmk{k} \Vsym{D} \mk{\ell} \Vstr{Az} \\
\derives \Vmk{j} \Vstr{Ba} \Vsym{C} \Vstr{Bz} \Vmk{k}
\end{gather*}

\textbf{Null passing}:
A location marker may be duplicated from one side of a nulling symbol
to the other.
For this example,
assume that
$\Vstr{nul1} = \epsilon$,
$\Vstr{tel1} \neq \epsilon$,
and
$\Vstr{tel2} \neq \epsilon$.
In
\begin{equation}
\Vstr{tel1} \Vmk{x} \Vstr{nul1}  \Vstr{tel2},
\end{equation}
we can duplicate the \Vmk{x}
\begin{equation}
\Vstr{tel1} \Vmk{x} \Vstr{nul1} \Vmk{x} \Vstr{tel2}.
\end{equation}
If one of the two \Vmk{x} markers is now clutter,
we may also delete it:
\begin{equation}
\Vstr{tel1} \Vstr{nul1} \Vmk{x} \Vstr{tel2}.
\end{equation}

\subsection{Simplification and nulling symbols}

Caution must be exercised because nulling symbols
can fall on either side of a location-marker.
The following theorem shows that what looks like a cycle
in location-marked notation is,
in fact, a cycle,
and therefore cannot occur in a Marpa grammar.

\begin{theorem}
\ttitle{Location marked cycles}
\label{t:location-marker-cycle}
Let \Vstr{sf} be a sentential form containing at
least one telluric symbol.
Then
\begin{equation}
\label{eq:location-marker-cycle-10}
  \Vmk{i} \Vstr{sf} \Vmk{j} \ndeplus \Vmk{i} \Vstr{sf} \Vmk{j}
\end{equation}
\end{theorem}

\begin{proof}
We represent
the possible nulls
outside our location markers in
\eqref{eq:location-marker-cycle-10}
in full generality as
\begin{align}
\label{eq:location-marker-cycle-12}
& \Vstr{nul1L} \Vmk{i} \Vstr{sf} \Vmk{j} \Vstr{nul1R} && \text{Step \var{x}} \\
\label{eq:location-marker-cycle-14}
  \deplus & \Vstr{nul2L} \Vmk{i} \Vstr{sf} \Vmk{j} \Vstr{nul2R}. && \text{Step \var{y}}
\end{align}
where
$\Vstr{nul1L} = \Vstr{nul1R} = \Vstr{nul2L} = \Vstr{nul2R} = \epsilon$.
We assume
\eqref{eq:location-marker-cycle-12}--\eqref{eq:location-marker-cycle-14}
for an outer reductio.

By assumption for the theorem there is at least
one telluric symbol in \Vstr{sf}.
Let \Vsym{tell} be one of those telluric symbols in Step \var{x},
and let \Vstr{descs} be its descendants in Step \var{y}.

We will write \Vop{T}{x} for the number of telluric symbols in \Vstr{x}
or \Vsym{x}.
No telluric symbol is nulling, so that
$\bigop{T}{\Vsym{tell}} \le \bigop{T}{\Vstr{descs}}$,
and therefore
$\bigop{T}{\Vstr{descs}} \ge 1$.

Assume for an inner reductio, that
there is some \Vsym{tell2} in
Step \var{x} of
\Vstr{sf},
such that $\bigop{T}{\Vstr{descs2}} > 1$,
where \Vstr{descs2} are the descendants of \Vsym{tell2}
in Step \var{y}.

Let \var{tell-cnt} be the number of telluric symbols in
\eqref{eq:location-marker-cycle-12}:
\[
\var{tell-cnt} =
\bigop{T}{ \Vstr{nul1L} } +
\bigop{T}{ \Vstr{sf}@\var{x}} +
\bigop{T}{ \Vstr{nul1R} }.
\]
Since $\Vstr{nul1L} = \Vstr{nul1R} = \epsilon$,
we have
$\var{tell-cnt} = \bigop{T}{\Vstr{sf}@\var{x}}$.
We have
\begin{equation}
\label{eq:location-marker-cycle-17}
\var{tell-cnt} = \bigop{T}{\Vstr{sf}@\var{x}}
= \bigop{T}{\Vstr{sf}@\var{y}}
\end{equation}
by the self-identity of \Vstr{sf}.

$\Vstr{nul2L} = \Vstr{nul2R} = \epsilon$,
so that if there is any
telluric symbol
in Step \var{y},
it will be in
$\var{sf}@\var{y}$.
Using
\eqref{eq:location-marker-cycle-17}
we see that if one telluric symbol in $\var{sf}@\var{x}$
derives
\var{n} telluric symbols in $\var{sf}@\var{y}$,
then the other $\Vdecr{tell-cnt}$ telluric symbols
in
$\var{sf}@\var{x}$ must derive
\xxsubtract{\var{tell-cnt}}{\var{n}}
telluric symbols.
This means that, if $\var{n} > 1$,
at least one telluric symbol in
$\var{sf}@\var{x}$
derives
zero telluric symbols in $\var{sf}@\var{y}$.
In other words,
if $\var{n} > 1$,
at least one telluric symbol in
$\var{sf}@\var{x}$ must be nulling.

But telluric symbols are never nulling,
which shows the inner reductio.
We conclude from the inner reductio that
no telluric symbol in
$\var{sf}@\var{x}$
derives more than one telluric symbol in
$\var{sf}@\var{y}$.

We have already shown that every telluric symbol in
Step \var{x}
derives at least one telluric symbol in Step \var{y}.
So we have that,
\begin{equation}
\label{eq:location-marker-cycle-20}
\myparbox{
for any telluric symbol
$\Vsym{tell2}@\var{x}$,
if \Vstr{descs2}@\var{y} are its descendants in
Step \var{y},
then $\bigop{T}{\Vstr{descs2}@\var{y}} = 1$.
}
\end{equation}

Recall our earlier assumption
in the outer reductio
that \Vsym{tell} is an arbitrary
telluric symbol in \var{sf}@\var{x}
and
\var{descs}@\var{y}
are its descendants.
We know from
\eqref{eq:location-marker-cycle-20}
that
$\bigop{T}{\Vstr{descs}@\var{y}} = 1$.
That is, each telluric symbol in Step \var{x}
maps one-to-one to a telluric descendant in
Step \var{y}.
What is the telluric symbol that \Vsym{tell}
maps to in \Vstr{descs}?

All the telluric symbols in
\eqref{eq:location-marker-cycle-12}
and
\eqref{eq:location-marker-cycle-14}
must be in
$\var{sf}@\var{x}$ and $\var{sf}@\var{y}$,
and
$\var{sf}@\var{x} = \var{sf}@\var{y}$,
so that the telluric symbols in
$\var{sf}@\var{x}$
must be the same, and in
the same order,
as those in
$\var{sf}@\var{y}$.
So a one-to-one mapping of telluric symbols from
$\var{sf}@\var{x}$
to telluric symbols in $\var{sf}@\var{y}$
must map each telluric symbol to itself.
Therefore, the telluric symbol in
$\Vstr{descs}@\var{y}$
is $\Vsym{tell}@\var{x}$.

We can therefore write the derivation of
\Vstr{descs} from
$\Vsym{tell}@\var{x}$,
without loss of generality,
as
\begin{equation}
\label{eq:location-marker-cycle-24}
\Vsym{tell} \deplus \Vstr{nulL} \Vsym{tell} \Vstr{nulR} = \Vstr{descs}
\end{equation}
where
$\Vstr{nulL} = \Vstr{nulR} = \epsilon$.
But, by the definition of cyclic,
\eqref{eq:location-marker-cycle-24}
is a cycle.
Cycles are not allowed in Marpa grammars,
which shows the outer reductio,
and the theorem.
\end{proof}

\chapter{Rewriting the grammar}
\label{ch:rewrite}

We have already noted
that no rules of \Cg{}
have a zero-length RHS,
and that all symbols must be either nulling or telluric.
These restrictions follow Aycock and Horspool~\cite{AH2002}.
The elimination of empty rules and proper nullables
is done by rewriting the grammar.
\cite{AH2002} shows how to do this
without loss of generality.

Because Marpa claims to be a practical parser,
it is important to emphasize
that all grammar rewrites in this monograph
allow the original grammar to be reconstructed
simply and efficiently at evaluation time.
As implemented,
the Marpa parser allows users to associate
semantics with an external grammar
that has none of the restrictions imposed
on the internal grammars.
As his external grammar,
the Marpa::R2 user
may specify any proper context-free grammar.
A ``proper'' grammar is one which is cycle-free,
and which contains no unproductive or inaccessible
symbols.\footnote{
In fact, as of this writing, Marpa::R2 has options
which allow grammars with cycles and inaccessible symbols,
but there is very little interest in these,
and future Marpa versions are likely to remove this support.
}

Marpa external grammars allow nullable,
properly nullable and nulling symbols,
as well as empty rules.
The user specifies his semantics in terms
of the external grammar.
Marpa rewrites the external grammar into
an internal grammar.
Parsing and evaluation
are performed
in such a way as to keep the internal grammar
invisible to
the user.
From the user's point of view,
the external grammar is the
one being used for the parse,
and the one to which
his semantics is applied.

The rewrite currently used by Marpa is an improvement over
that of~\cite{AH2002}.
Rules with proper nullables are identified
and a new grammar is created
in which the external grammar's rules are divided
up so that no rule has more than two proper nullables.
(A ``proper nullable'' is a nullable symbol which is not nulling.)
This is similar to a rewrite into Chomsky form.

The proper nullable symbol is then cloned into two others:
one nulling and one telluric.
All occurrences of the original proper nullable symbol are then replaced
with one of the two new symbols,
and new rules are created as necessary to ensure that all possible combinations
of nulling and telluric symbols are accounted for.

The rewrite in~\cite{AH2002} was similar, but did not do the Chomsky-style
rewrite before replacing the proper nullables.
As a result the number of rules in the internal grammar could be
an exponential function of numbers in the external grammar.
In our version, the worst case growth in the number of rules is linear.

This rewrite can be undone easily.
In fact,
in the current implementation of Marpa,
the reverse rewrite,
from internal to external,
is often done ``on the fly'',
as the parse proceeds.
This translation back and forth is
efficient,
and is done for error reporting, tracing,
and in the implementation of Marpa::R2's event
mechanism.

Future plans for Marpa include more aggressive use
of rewrites.
It should be possible, not only to eliminate proper
nullables from the internal grammar,
but also to eliminate nulling symbols.
We conjecture that elimination of nulling symbols
from the internal grammar will greatly simplify the implementation.
The reader may observe that it would
simplify this monograph if it did not have to deal with nulling
symbols.

Not all rewrites lend themselves to easy translation
and reversal.
As a future direction, we will look at a general schema
for ``safe'' grammar rewrites.
In this schema, Marpa's internal grammar will have
``brick'' and ``mortar'' symbols.
Internal brick symbols correspond, many-to-one, to
external symbols.
Internal mortar symbols exist entirely for the purposes
of the internal grammar.
Only brick symbols have semantics attached to them.

Assume that we have a parse, using internal symbols.
We define a ``brick traversal'' from a ``root'' brick non-terminal instance.
The ``brick traversal'' is pre-order
and stops traversing any path when it hits
a brick symbol instance other than the ``brick root''.
In this way, it traces a subtree of the parse,
where the root of the subtree is the brick root symbol instance,
and the leaves of the subtree are a sequence of other brick
symbol instances.
The leaves of the subtree, as encountered in pre-order,
constitute its ``brick frontier''.
Mortar symbols will only occur in the interior of this ``brick'' subtree,
never as its root or its leaf.

An internal symbol instance \textbf{matches}
an external symbol instance if and only if
\begin{itemize}
\item they have the same symbol;
\item they have the same left location; and
\item they have the same right location.
\end{itemize}

For a rewrite to be ``safe'':
\begin{itemize}
\item Every brick symbol must translate to exactly one
external symbol.
\item Every terminal symbol instance must be a brick symbol.
\item The internal and external input sequences must be the same length.
\item The internal and external input sequences must allow
a shared indexing
scheme, which indexes the input symbols consecutively from
left to right.
\item
For every index \var{i},
the \var{i}'th symbol instance in the internal input sequence
must match
the \var{i}'th symbol instance in the external input sequence.
\item Every brick traversal must translate to an external rule
instance,
and vice versa,
as follows:
\begin{itemize}
\item The brick root symbol instance must match
the LHS symbol instance of the external rule instance.
\item
The brick frontier must be the same length as
the RHS of the rule.
\item
The brick frontier and the external rule RHS must allow a shared indexing
scheme,
which indexes both of them
consecutively
from left to right.
\item
For every index \var{i},
the \var{i}'th
instance in the brick frontier must
match the \var{i}'th symbol instance
of the external rule RHS.
\end{itemize}
\end{itemize}

\chapter{Dotted rules}
\label{ch:dotted}

\section{Definition}

\begin{definition}
\dtitle{Dotted rule}
\label{def:dotted-rule}
Let $\Vrule{r} \in \Crules$
be a rule.
Recall that \Vsize{r}
is the length of its RHS.
A dotted rule (type \dtype{DR}) is a duple, $[\Vrule{r}, \var{dotix}]$.
\var{dotix} is
the
\dfn{dot RHS index}
or
\dfn{dot index},
and is such that
$0 \le \var{dotix} \le \size{\Vrule{r}}$.
The dot index
indicates the extent to which
the rule has been recognized.
It is often
represented with a large raised dot,
so that if
\begin{equation*}
[\Vsym{A} \de \Vsym{X} \Vsym{Y} \Vsym{Z}]
\end{equation*}
is a rule,
\begin{equation}
\label{eq:def-dotted-rule-10}
\Vdr{dr} = [\Vsym{A} \de \Vsym{X} \Vsym{Y} \mydot \Vsym{Z}]
\end{equation}
is the dotted rule with the dot at
$\var{dotix} = 2$,
that is,
between \Vsym{Y} and \Vsym{Z}.

We write
\Vop{Dotix}{x}%
\index{recce-notation}{Dotix(x)@\Vop{Dotix}{x}}
for the dot index of
\Vdr{x},
and \Vop{Rule}{x}%
\index{recce-notation}{Rule(x)@\Vop{Rule}{x}}
for the rule of \Vdr{x}.
For example, where \Vdr{dr} is as in
\eqref{eq:def-dotted-rule-10},
\begin{gather*}
  \op{Dotix}{\Vdr{dr}} = 2 \\
  \text{and} \quad
\op{Rule}{\Vdr{dr}} = [\Vsym{A} \de \Vsym{X} \Vsym{Y} \Vsym{Z}].
\end{gather*}
\end{definition}

In the discussions to follow
we will also refer to a
``dot location''.
The dot location should not be confused with the
dot index.
Dot locations will be locations in the input,
and will require the dotted rule
to be placed in the context of an input,
as will be explained in
Chapter \ref{ch:earley-items}.

We will sometimes write the dotted rule as a duple,
for example,
we might write
\eqref{eq:def-dotted-rule-10}
as
\[
[ [ \Vsym{A} \de \Vsym{X} \Vsym{Y} \Vsym{Z} ], 2 ]
\]
or redundantly, as
\[
[ [ \Vsym{A} \de \Vsym{X} \Vsym{Y} \mydot \Vsym{Z} ], 2 ].
\]

\begin{definition}
\dtitle{Rule notions applied to dotted rules}
\label{def:dr-rule-notions}
Whenever we apply a rule notion to a dotted rule,
call it \Vdr{dr},
we mean to apply that notion to
the rule of the dotted rule,
or \Rule{\Vdr{dr}}.
\end{definition}

\section{Properties}

\begin{definition}
\dtitle{Postdot}
\label{def:postdot}
\index{recce-notation}{Postdot(dr)}%
\[
\Postdot{\Vdr{x}} \defined
\begin{cases}
\begin{aligned}
& \Vsym{B}, \; && \text{if $\Vdr{x} = [\Vsym{A} \de \Vstr{s1} \mydot \Vsym{B} \cat \Vstr{s2}]$} \\
& \undefined, \; && \text{if $\Vdr{x} = [\Vsym{A} \de \Vstr{rhs} \mydot]$}
\end{aligned}
\end{cases}
\]
\end{definition}

\begin{definition}
\dtitle{Predot}
\label{def:predot}
\index{recce-notation}{Predot(dr)}%
\[
\Predot{\Vdr{x}} \defined
\begin{cases}
\begin{aligned}
& \Vsym{B}, \; && \text{if $\Vdr{x} = [\Vsym{A} \de \Vstr{s1} \cat \Vsym{B} \mydot \Vstr{s2}]$} \\
& \undefined, \; && \text{if $\Vdr{x} = [\Vsym{A} \de \mydot \Vstr{rhs} ]$}
\end{aligned}
\end{cases}
\]
\end{definition}

\begin{definition}
\dtitle{Next}
\label{def:next}
\index{recce-notation}{Next(dr)}%
\[
\Next{\Vdr{x}} \defined
\begin{cases}
[\Vsym{A} \de \Vstr{s1} \cat \Vsym{B} \mydot \Vstr{s2}],  \\
\begin{aligned}
& \qquad && \text{if $\Vdr{x} =
[\Vsym{A} \de \Vstr{s1} \mydot \Vsym{B} \cat \Vstr{s2}]$} \\
& \undefined, && \text{if $\Vdr{x} = [\Vsym{A} \de \Vstr{rhs} \mydot]$}
\end{aligned}
\end{cases}
\]
\end{definition}

\begin{definition}
\dtitle{Prev}
\label{def:prev}
\index{recce-notation}{Prev(dr)}%
\[
\Prev{\Vdr{x}} \defined
\begin{cases}
[\Vsym{A} \de \Vstr{s1} \mydot \Vsym{B} \cat \Vstr{s2}],  \\
\begin{aligned}
& \qquad && \text{if $\Vdr{x} =
[\Vsym{A} \de \Vstr{s1} \cat \Vsym{B} \mydot \Vstr{s2}]$} \\
& \undefined, && \text{if $\Vdr{x} = [\Vsym{A} \de \mydot \Vstr{rhs} ]$}
\end{aligned}
\end{cases}
\]
\end{definition}

\begin{definition}
\dtitle{Prefix and suffix}
\label{def:prefix}
If a dotted rule is
\[
[\Vsym{A} \de \Vstr{prefix} \mydot \Vstr{suffix}]
\]
we say that \Vstr{prefix} is the
\dfn{dot prefix},
and that
\Vstr{suffix} is the
\dfn{dot suffix}.
\end{definition}

\section{Types}

The \dfn{start dotted rule} is
\begin{equation}
\label{eq:start-rule-def-10}
\Vdr{start} = [\Vsym{accept} \de \mydot \Vsym{start} ].
\end{equation}
The \dfn{accept dotted rule} is
\begin{equation*}
\label{eq:accept-rule-def-10}
\Vdr{accept} = [\Vsym{accept} \de \Vsym{start} \mydot ].
\end{equation*}

We divide all dotted rules into five disjoint types:
start, prediction, null-scan, read and reduction.

\begin{baredefinition}
\dtitle{Start}
\label{def:start-dr}
The
start dotted rule was defined
in \eqref{eq:start-rule-def-10}.
Its type is
\xdfn{start}{start (dotted rule)}.
\end{baredefinition}

\begin{baredefinition}
\dtitle{Prediction}
\label{def:prediction-dr}
If a dotted rule does not have a predot symbol and is not the start dotted rule,
it is a
\xdfn{predicted dotted rule}{predicted (dotted rule)}
or a
\xdfn{prediction}{prediction (dotted rule)}.
\end{baredefinition}

A predicted dotted rule
always has a dot position of zero,
for example,
\begin{equation*}
\Vdr{predicted} = [\Vsym{A} \de \mydot \Vstr{alpha} ].
\end{equation*}

\begin{baredefinition}
\dtitle{Null-scan}
\label{def:null-scan-dr}
If a dotted rule does have a predot symbol and that symbol is a nulling terminal,
that dotted rule
is a
\xdfn{null-scan}{null-scan (dotted rule)}
dotted rule.
\end{baredefinition}

\begin{baredefinition}
\dtitle{Read}
\label{def:read-dr}
If a dotted rule does have a predot symbol and that symbol is a telluric terminal,
the dotted rule is a
\xdfn{read}{read (dotted rule)}
dotted rule.
\end{baredefinition}

\begin{definition}
\dtitle{Reduction}
\label{def:reduction-dr}
If a dotted rule does have a predot symbol and that symbol is a non-terminal,
it is a
\xdfn{reduced}{reduced (dotted rule)}
dotted rule,
or a
\xdfn{reduction}{reduction (dotted rule)}.
\end{definition}

\begin{definition}
\dtitle{Ethereal and telluric dotted rules}
\label{def:telluric-dr}
A start dotted rule,
or a dotted rule with a telluric predot symbol
is called
a \xdfn{telluric}{telluric!DR}
dotted rule.
All other dotted rules are called
\xdfn{ethereal}{ethereal!DR}
dotted rules.
\end{definition}

The idea is that telluric dotted rules are ``grounded'' either
in the input or in the initial state of the parse,
while
ethereal dotted rules emerge out of an ``invisible'' realm.

\begin{theorem}
\ttitle{Ethereal and telluric dotted rules}
\label{t:telluric-dr}
Prediction and null-scan dotted rules are ethereal
dotted rules.
Start, reduction and read dotted rules are telluric.
\end{theorem}

\begin{proof}
The theorem follows from
\dref[start DR]{def:start-dr},
\dref[prediction DR]{def:prediction-dr},
\dref[null-scan DR]{def:null-scan-dr},
\dref[read DR]{def:read-dr},
\dref[reduction DR]{def:reduction-dr},
and
\dref[telluric and ethereal DR's]{def:telluric-dr}.
\end{proof}

\begin{definition}
\dtitle{Confirmed dotted rules}
\label{def:confirmed-drs}
A
\xdfn{confirmed dotted rule}{confirmed (dotted rule)},
or
\xdfn{confirmation}{confirmation (dotted rule)},
is a dotted rule
with a dot position greater than zero.
A
\xdfn{complete dotted rule}{complete (dotted rule)},
is a dotted rule with its dot
position after the end of its RHS,
for example,
\begin{equation*}
\Vdr{complete} = [\Vsym{A} \de \Vstr{alpha} \mydot ].
\end{equation*}
\end{definition}

\begin{definition}
\dtitle{Penultimate dotted rules}
\label{def:penultimate-drs}
A
\xdfn{penultimate dotted rule}{penultimate (dotted rule)},
or a
\xdfn{penult}{penult (dotted rule)},
is a dotted rule with exactly one symbol
between its
dot position and the end of its RHS,
for example,
\begin{equation*}
\Vdr{penult} = [\Vsym{A} \de \Vstr{alpha} \mydot \Vsym{B} ].
\end{equation*}
\end{definition}

\section{Quasi-types}

When classifying dotted rules,
it is often convenient
to ignore the effect of nulling symbols.
Intuitively, if a dotted rule is of the kind ``X'',
then a quasi-X dotted rule is a dotted rule that would be
of kind X, if it were not for its nulling symbols.

\begin{definition}
\dtitle{Quasi-types}
\label{def:quasi-types}
A dotted rule which has only nulling symbols in its dot
suffix is
\xdfn{quasi-complete}{quasi-complete (dotted rule)}.
A quasi-complete dotted rule is called a
\xdfn{quasi-completion}{quasi-completion (dotted rule)}.

A dotted rule which has exactly one telluric symbol in
its dot suffix is
\xdfn{quasi-penultimate}{quasi-penultimate (dotted rule)}.
A quasi-penultimate dotted rule is called a
\xdfn{quasi-penult}{quasi-penult (dotted rule)}.

If a dotted rule is not quasi-complete,
it is said to be
\xdfn{quasi-incomplete}{quasi-incomplete (dotted rule)}.

A dotted rule which has only nulling symbols before the dot
is a
\xdfn{quasi-predicted}{quasi-predicted (dotted rule)}
dotted rule,
or a
\xdfn{quasi-prediction}{quasi-prediction (dotted rule)}.
If a dotted rule is not a
quasi-prediction,
then it is a
\xdfn{quasi-confirmed}{quasi-confirmed (dotted rule)}
dotted rule,
or a
\xdfn{quasi-confirmation}{quasi-confirmation (dotted rule)}.
\end{definition}

The definitions of the quasi-types may be satisfied vacuously:
for example,
all complete dotted rules are quasi-complete dotted rules
and
all predicted dotted rules are quasi-predicted dotted rules.

\begin{definition}
\dtitle{Completion of a dotted rule}
\label{def:completion-of-a-dotted-rule}
If
\begin{equation*}
\begin{split}
\Vdr{quasi} & = [\Vsym{A} \de \Vstr{alpha} \mydot \Vstr{nulls} ] \\
\Vdr{completion} & = [\Vsym{A} \de \Vstr{alpha} \cat \Vstr{nulls} \mydot ] \\
& \qquad \text{where} \quad \Vstr{nulls} = \epsilon
\end{split}
\end{equation*}
is a pair of dotted rules,
we say that \Vdr{completion} is the
\xdfn{completion dotted rule}{completion (dotted rule)!wrt another dotted rule}
of the quasi-complete dotted rule \Vdr{quasi}.
\end{definition}

This definition may be satisfied vacuously:
every complete dotted rule is its own completion dotted rule.

\begin{theorem}
\ttitle{Quasi-predicted dotted rule is not quasi-completed}
\label{t:quasi-drs-disjoint}
In Marpa grammars,
no quasi-completed dotted rule
is a quasi-predicted dotted rule.
\end{theorem}

\begin{proof}
The rewrite of
Marpa grammars
eliminates all nullable rules.
So every rule must have a telluric symbol.
In a dotted rule, therefore,
there must be
at least one telluric symbol
and it must come either before the dot
or after it.
If a telluric symbol comes before the dot,
the dotted rule might be quasi-completed,
but it cannot be a quasi-prediction.
If a telluric symbol comes after the dot,
the dotted rule might be a quasi-prediction,
but it cannot be quasi-complete.
\end{proof}

\section{Fleeting and lasting bases}

A dotted rule with a null predot symbol is called a
\xdfn{fleeting base}{fleeting base (dotted rule)}.
Any other dotted rule is called a
\xdfn{lasting base}{lasting base (dotted rule)}.
A prediction is always a lasting base.

Every dotted rule,
even if it is not a lasting base itself,
has a
\xdfn{lasting base}{lasting base (dotted rule)!wrt another dotted rule}.
\Vdr{bas} is the lasting base of \Vdr{dr}
if and only if
\Vdr{bas} is a lasting base,
and
\begin{equation}
\label{eq:def-lasting-base-10}
\begin{gathered}
\Rule{\Vdr{bas}} = \Rule{\Vdr{dr}}, \quad
\Dotix{\Vdr{bas}} \le \Dotix{\Vdr{dr}}, \quad \text{and} \\
\forall \; \var{i} : \Dotix{\Vdr{bas}} \le \var{i} < \Dotix{\Vdr{dr}}
\implies \RHS{\Vdr{dr}, \var{i}} = \epsilon.
\end{gathered}
\end{equation}
Note that
\eqref{eq:def-lasting-base-10}
may be satisfied vacuously ---
a prediction is its own lasting base.

\begin{theorem}
\ttitle{Dotted rule lasting base}
\label{dotted-rule-lasting-base}
Every dotted rule has a lasting base.
\end{theorem}

\begin{proof}
The lasting base of a dotted rule is another,
not necessarily distinct, dotted rule.
Let \Vdr{dr} be a dotted rule.
If
\[
  \Predot{\Vdr{dr}} \neq \epsilon \; \lor \;
  \Predot{\Vdr{dr}} = \undefined,
\]
then \Vdr{dr} is its own lasting base.
If $\Predot{\Vdr{dr}} = \epsilon$ so that,
without loss of generality,
\begin{equation}
\Vdr{dr} = [\Vsym{A} \de \Vstr{before} \Vstr{nulls} \Vsym{nul} \mydot \Vstr{after} ]
\end{equation}
where $\Vstr{nulls} = \epsilon$
and $\Vsym{nul} = \epsilon$,
then the
lasting base
of \Vdr{dr} is
\begin{equation}
[\Vsym{A} \de \Vstr{before} \mydot \Vstr{nulls} \Vsym{nul} \Vstr{after} ]
\qedhere
\end{equation}
\end{proof}

\section{The transition function}

We define
a partial transition function from
pairs of dotted rule and symbol
to sets of dotted rules.
\begin{equation*}
\GOTO: \Cdr, (\epsilon \cup \var{vocab}) \mapsto 2^\Cdr.
\end{equation*}
$\GOTO(\Vdr{from}, \epsilon)$ is a
\dfn{null transition}
and its result is a \dfn{null transition set}.
``null'' is an overloaded term,
so we more often call the null transition
an \dfn{ethereal transition}
and the null transition set
an \dfn{ethereal transition set}.
If a transition is not an ethereal transition,
it is a \dfn{telluric transition},
and if a transition set
is not an ethereal transition set,
it is a \dfn{telluric transition set}.

A telluric transition set is always the empty set
or a singleton set.
Only ethereal transition sets have
cardinalities greater than one.
The dotted rules in the set that results from an ethereal transition
will be either predictions or confirmed rules with
a nulling predot symbol.

Where the transition is over a symbol,
call it \Vsym{A},
\begin{multline*}
\GOTO(\Vdr{from}, \Vsym{A}) = \\
\begin{cases}
\begin{aligned}
& \left\lbrace \Next{\Vdr{from}} \right\rbrace,
  && \text{if $\Vsym{A} = \Postdot{\Vdr{from}}$} \\
& \emptyset,
  && \text{otherwise}
\end{aligned}
\end{cases}
\end{multline*}

Ethereal transitions are more complicated,
but their analysis will come in useful later.
Let \var{null-scan-dr-op} be the set of
pairs of dotted rules
\begin{equation}
\label{eq:def-null-scan-dr-op}
\begin{gathered}
\left\lbrace \Vdr{cause}, \Vdr{effect} \right\rbrace \quad \text{such that} \\
\Vdr{effect} = \Next{\Vdr{cause}} \quad \text{and} \\
\Predot{\Vdr{effect}} \derives \epsilon.
\end{gathered}
\end{equation}

\begin{definition}
\dtitle{Causes of null scan dotted rule}
\label{def:causes-null-scan-dr}
In equation
\eqref{eq:def-null-scan-dr-op},
we say that \Vdr{cause} is the
\xdfn{top-down cause}{top-down cause!DR as top-down cause of null-scan DR}
of \Vdr{effect},
and that \Predot{\Vdr{effect}} is the
\xdfn{bottom-up cause}{bottom-up cause!DR as bottom-up cause of null-scan DR}
of \Vdr{effect}.
\end{definition}

We can use \var{null-scan-dr-op} to define an equivalence relation.
Intuitively, two dotted rules, \Vdr{dr1}
and \Vdr{dr2} are \dfn{ethereally equivalent} if
\Vdr{dr1} can be changed into \Vdr{dr2}
by iteration of \var{null-scan-dr-op}.
More formally, we define \var{eth-eq} to be the reflexive, symmetric
and transitive closure of
\var{null-scan-dr-op}.
We say that \Vdr{dr1} is
\dfn{ethereally equivalent} to \Vdr{dr2} if
and only if
\Vdr{dr1} is an element of the
equivalence class of \var{eth-eq} under \Vdr{dr2}.

Let \var{predict-dr-op} be the set of
pairs of dotted rules
\begin{equation}
\label{eq:def-predict-dr-op}
\begin{gathered}
\left\lbrace \Vdr{cause}, \Vdr{effect} \right\rbrace \quad \text{such that} \\
\Postdot{\Vdr{cause}} = \LHS{\Vdr{effect}} \quad \text{and} \\
\Dotix{\Vdr{effect}} = 0
\end{gathered}
\end{equation}

\begin{definition}
\dtitle{Causes of predicted dotted rules}
\label{def:causes-predicted-dr}
In equation
\eqref{eq:def-predict-dr-op},
we say that \Vdr{cause} is the
\xdfn{top-down cause}{top-down cause!DR as top-down cause of a predicted DR}
of \Vdr{effect}.
For symmetry with other types of dotted rule,
we say that \Vdr{effect}
has a bottom-up cause,
but that the
\xdfn{bottom-up cause}{bottom-up cause!DR, as bottom-up cause of a predicted DR}
of \Vdr{effect}
is ethereal.
\end{definition}

\begin{FlushLeft}
Let
\begin{equation}
\var{epsilon-dr-op} = \var{null-scan-dr-op} \cup \var{predict-dr-op}.
\end{equation}
We are now in a position to define the ethereal transition of \GOTO{}
from the dotted rule \Vdr{from}.
It is the transitive closure of \var{epsilon-dr-op}
over the singleton set containing the dotted rule argument of \GOTO{}
if there is a postdot symbol.
Otherwise it is the empty set.
\begin{multline*}
\GOTO(\Vdr{from}, \epsilon) = \\
\begin{cases}
\begin{aligned}
& \var{epsilon-dr-op}^+(\lbrace \Vdr{from} \rbrace),
  && \text{if $\Postdot{\Vdr{from}} \neq \undefined$} \\
& \emptyset,
  && \text{otherwise}
\end{aligned}
\end{cases}
\end{multline*}

\end{FlushLeft}

The
\xdfn{ethereal closure}{ethereal closure (of a dotted rule)}
is the reflexive and transitive closure of
\var{epsilon-dr-op}:
\[\var{ethereal-dr-closure} \defined \var{epsilon-dr-op}^\ast.\]
We say that
the ethereal closure for a dotted rule is the ethereal closure of the singleton
set containing that dotted rule:
\begin{multline*}
\var{ethereal-dr-closure}(\Vdr{base}) \defined  \var{ethereal-dr-closure}(\lbrace \Vdr{base} \rbrace)
\end{multline*}

Let
\begin{equation}
\Vdrset{ec} = \var{ethereal-dr-closure}(\lbrace \Vdr{base} \rbrace).
\end{equation}
We also call \Vdrset{ec} an \dfn{ethereal closure}
and we say that \Vdr{base} is its \dfn{base}.
If \Vdr{base} is telluric, we say that
\Vdr{base} is a \dfn{telluric base}.
We call \Vdr{tell} a telluric base
of a dotted rule \Vdr{dr2} if and only if
it is telluric and
\[ \Vdr{dr2} \in \var{ethereal-dr-closure}(\lbrace \Vdr{tell} \rbrace). \]

\section{Ethereal closures}

\begin{theorem}
\ttitle{Ethereal equivalents have same telluric base}
\label{t:eth-eq-share-telluric-base}
If the dotted rules \Vdr{dr1}
and \Vdr{dr2} are ethereally equivalent,
and \Vdr{dr1} is quasi-confirmed,
then \Vdr{dr1}
and \Vdr{dr2} have the same telluric base.
\end{theorem}

\begin{proof}
By assumption for the theorem,
\Vdr{dr1} is quasi-confirmed,
so that
by Theorem \ref{t:quasi-drs-disjoint},
\Vdr{dr1}
is not a quasi-prediction.
Therefore, \Vdr{dr1} has a telluric symbol in its
dot prefix.
Therefore,
\Vdr{dr1} has a telluric base.
Without loss of generality,
we let
\begin{equation}
\label{eq:eth-eq-share-telluric-base-10}
\Vdr{dr1} = [ \Vsym{A} \de \Vstr{pre} \cat \Vsym{tell} \cat \Vstr{nulls1} \mydot \Vstr{post1} ],
\end{equation}
and let the telluric base be
\begin{equation}
\label{eq:eth-eq-share-telluric-base-20}
\Vdr{tell} = [ \Vsym{A} \de \Vstr{pre} \cat \Vsym{tell} \mydot \Vstr{nulls1} \cat \Vstr{post1} ],
\end{equation}
where $\Vstr{nulls1} = \epsilon$.

We now proceed by overlapping cases.
In the first case,
the dot in \Vdr{dr2} comes at or after the dot in \Vdr{dr1}.
Since \Vdr{dr2} is ethereally equivalent
to
\eqref{eq:eth-eq-share-telluric-base-10},
we have,
if we rewrite \Vstr{post1}
as $\Vstr{nulls2} \cat \Vstr{post2}$,
\begin{multline}
\label{eq:eth-eq-share-telluric-base-23}
\Vdr{dr2} =
  [ \Vsym{A} \de \Vstr{pre} \cat \Vsym{tell} \cat \Vstr{nulls1} \cat \Vstr{nulls2} \mydot \Vstr{post2} ].
\end{multline}
Therefore, from
\eqref{eq:eth-eq-share-telluric-base-20},
\eqref{eq:eth-eq-share-telluric-base-23}
and the definition of ethereal closure,
\[ \Vdr{dr2} \in \var{ethereal-dr-closure}(\lbrace \Vdr{tell} \rbrace).\]
By the definition of telluric base,
\Vdr{tell} is the telluric base of \Vdr{dr2}.

In the second case
the dot in \Vdr{dr2} comes at or before the dot in \Vdr{dr1}.
We may write
\begin{equation*}
\Vdr{dr2} = [ \Vsym{A} \de \Vstr{pre} \cat \Vsym{tell} \cat \Vstr{nulls1a} \mydot \Vstr{nulls1b} \cat \Vstr{post1} ],
\end{equation*}
where $\Vstr{nulls1} = \Vstr{nulls1a} \cat \Vstr{nulls1b}.$
Again,
by the definition of telluric base,
\Vdr{tell} is the telluric base of \Vdr{dr2}.
In both cases,
we have shown that
\Vdr{tell} is the telluric base of \Vdr{dr2}.
\end{proof}

\begin{theorem}
\ttitle{Telluric base of a quasi-confirmed dotted rule is unique}
\label{quasi-confirmed-unique-telluric-base}
If a dotted rule is quasi-confirmed,
its telluric base is unique.
\end{theorem}

\begin{proof}
Let the dotted rule be \Vdr{dr}.
This theorem follows
directly
from Theorem \ref{t:eth-eq-share-telluric-base},
if you set both of its dotted rules to \Vdr{dr}.
\end{proof}

The complexity of the ethereal closure is of interest:
we may want to compute it on the fly,
and in any case,
we certainly want to show that
the ethereal closure has finite time complexity.
\begin{algorithm}[tb]
\algtitle{Add a generation to the ethereal closure}{alg:ethereal-generation}
\begin{algorithmic}[1]
\Procedure{Ethereal next}{\Vdr{this}, \Vdrset{results}, \Vdrset{work}}
\If{\Vdr{this} has no postdot symbol}
\State return
\EndIf
\State Here \Vdr{this} is $[ \Vsym{lhs} \de \Vstr{before} \mydot \Vsym{A} \cat \Vstr{after} ]$
\label{line:ethereal-generation-20}
\State \Comment We can state this without loss of generality
\If{$\Vsym{A}$ is a nulling symbol}
\State $\Vdr{new} \gets [ \Vsym{lhs} \de \Vstr{before} \cat \Vsym{A} \mydot \Vstr{after} ]$
\State Add \Vdr{new} to \Vdrset{results} \ldots
\State $\qquad$ but only if it has never been added before
\State Add \Vdr{new} to \Vdrset{work} \ldots
\State $\qquad$ but only if it has never been added before
\State return
\EndIf
\label{line:ethereal-generation-40}
\State Here \Vsym{A} must be a telluric symbol
\For{ each \Vrule{r} in \Cg{}}
\If{ $\LHS{\Vrule{r}} = \Vsym{A}$ }
\State Here \Vrule{r} is $[ \Vsym{A} \de \Vstr{rhs} ]$
\State \Comment We can state this without loss of generality
\State $\Vdr{new} \gets [ \Vsym{A} \de \mydot \Vstr{rhs} ]$
\State Add \Vdr{new} to \Vdrset{results} \ldots
\State $\qquad$ but only if it has never been added before
\State Add \Vdr{new} to \Vdrset{work} \dots
\label{line:ethereal-generation-60}
\State $\qquad$ but only if it has never been added before
\EndIf
\EndFor
\State return
\EndProcedure
\end{algorithmic}
\end{algorithm}

\begin{algorithm}[tb]
\algtitle{Create ethereal closure}{alg:ethereal-closure}
\begin{algorithmic}[1]
\Function{Create ethereal closure}{\Vdr{base}}
\State $\Vdrset{result} \gets \emptyset$
\State $\Vdrset{work} \gets \emptyset$
\State \Call{Ethereal next}{\Vdr{base}, \Vdrset{result}, \Vdrset{work}}
\While{$\Vdrset{work} \neq \emptyset$}
\State Remove a dotted rule from \Vdrset{work}, call it \Vdr{this}
\State \Call{Ethereal next}{\Vdr{this}, \Vdrset{result}, \Vdrset{work}}
\EndWhile
\State return \Vdrset{result}
\EndFunction
\end{algorithmic}
\end{algorithm}

Algorithm \ref{alg:ethereal-closure}
is not actually used by any
of Marpa's versions ---
it is chosen because it is
convenient for exploring the theory.
In the actual implementation,
null-scans are dealt with implicitly,
while predictions are explicitly computed after
each Earley set is otherwise complete.

\begin{theorem}\label{t:ethereal-closure-Oc}
\ttitle{Ethereal closure is constant time}
Ethereal closure has time complexity \Oc{}.
\end{theorem}

\begin{proof}
We consider Algorithm \ref{alg:ethereal-closure}.
This clearly runs in \Oc{} time if there is a constant
number of calls to
Algorithm \ref{alg:ethereal-generation}.

To finish the proof, we need to show
that
Algorithm \ref{alg:ethereal-generation}
is called a constant number
of times.
Algorithm \ref{alg:ethereal-generation}
is called
once for the base dotted rule of the computation.
It is called again for every dotted rule added to the working set
of dotted rules, \Vdrset{work}.
We know that no dotted rule is added to
\Vdrset{work} twice.
Therefore
Algorithm \ref{alg:ethereal-generation}
is called
at most once for each dotted rule.
\Cg{} has a fixed number of dotted rules,
so
that Algorithm \ref{alg:ethereal-generation}
is called
at most \Oc{} times.
\end{proof}

\begin{theorem}\label{t:ethereal-closure-dr-correct}
\ttitle{Ethereal closure algorithm is correct}
Algorithm \ref{alg:ethereal-closure} is correct.
\end{theorem}

\begin{proof}
From examining
Algorithm \ref{alg:ethereal-closure},
in particular
lines
\ref{line:ethereal-generation-20}-\ref{line:ethereal-generation-40}
of
Algorithm \ref{alg:ethereal-generation},
we see that
\begin{equation}
\label{ethereal-closure-correct-2}
\myparbox{
the null transitions
for nulling postdot symbols are complete and consistent,
and therefore correct.
}
\end{equation}

From examining
Algorithm \ref{alg:ethereal-closure},
in particular
lines
\ref{line:ethereal-generation-40}--\ref{line:ethereal-generation-60}
of
Algorithm \ref{alg:ethereal-generation},
we see that the null transitions for predictions are
properly made,
so that
\begin{equation}
\label{ethereal-closure-correct-3}
\myparbox{
the set of predictions is consistent.
}
\end{equation}

It remains to show that the set of predictions is complete.
Algorithm \ref{alg:ethereal-closure}
clearly adds all predictions derivable in a single step
to its results.
It also
calls the ``Ethereal next'' function
repeatedly, so that indirect predictions will be added.
But it will refuse to
add a dotted rule to its working set more than once.
We need to consider whether this means some predictions
will not be derived.

Consider a prediction
\begin{equation}
\label{ethereal-closure-correct-5}
\Vsym{lhs-pred} \de \mydot \Vsym{pred-rhs}
\end{equation}
which is derived through a series of dotted rule predictions
added to the work list at line
\ref{line:ethereal-generation-60}
of Algorithm \ref{alg:ethereal-generation}.
For a reductio,
assume that one prediction,
call it
\begin{equation}
\label{ethereal-closure-correct-15}
[ \Vsym{lhs-dup} \de \mydot \Vsym{rhs-dup} ],
\end{equation}
occurs twice.
Without loss of generality, let that chain be
\begin{align*}
& [ \Vsym{lhs0} \de \mydot \Vsym{rhs0} ] && \text{Step 0} \\
& [ \Vsym{lhs1} \de \mydot \Vsym{rhs1} ] && \text{Step 1} \\
& \ldots && \\
& [ \Vsym{lhs-predup} \de \mydot \Vsym{lhs-dup} \cat \Vstr{after-predup} ] && \text{Step \Vdecr{i}} \\
& [ \Vsym{lhs-dup} \de \mydot \Vsym{rhs-dup} ] && \text{Step \var{i}} \\
& \ldots && \\
& [ \Vsym{lhs-predup2} \de \mydot \Vsym{lhs-dup} \cat \Vstr{after-predup2} ] && \text{Step \Vdecr{j}} \\
& [ \Vsym{lhs-dup} \de \mydot \Vsym{rhs-dup} ] && \text{Step \var{j}}\\
& \ldots && \\
& [ \Vsym{lhs-penult} \de \mydot \Vsym{rhs-penult} ] && \\
& [ \Vsym{lhs-last} \de \mydot \Vsym{rhs-last} ]
\end{align*}
where Step \var{i} is the first occurrence of
\eqref{ethereal-closure-correct-15},
and Step \var{j} is the last.
We can create a shorter chain of predictions by removing the steps in
the chain from Step $\var{i}+1$ to Step \var{j}.
Call this process of removing steps, ``pruning duplicates''.

By pruning duplicates for every prediction which occurs twice in
the chain,
we see that we can create a chain that results in
\eqref{ethereal-closure-correct-5},
but which does not contain any prediction more than once.
We can also see that, since
Algorithm \ref{alg:ethereal-closure} follows all chains
that contain no duplicate predictions,
Algorithm \ref{alg:ethereal-closure} will add
\eqref{ethereal-closure-correct-5} to its result.

Since
\eqref{ethereal-closure-correct-5} was chosen without loss
of generality,
we see that every prediction can be reached by following
a chain of predictions with no duplicate predictions,
and that therefore
\begin{equation}
\label{ethereal-closure-correct-40}
\myparbox{
Algorithm \ref{alg:ethereal-closure} adds a complete
set of predictions.
}
\end{equation}

We now summarize our results.
By definition, the ethereal closure is the
transitive closure of the union
of predictions and null-scans.
In \eqref{ethereal-closure-correct-2}
we showed that the sets of
null-scans added are correct and,
in \eqref{ethereal-closure-correct-3},
that the set of predictions added is consistent.
In
\eqref{ethereal-closure-correct-40}
we showed
that the set of predictions
added is complete.
This shows the theorem.
\end{proof}

\chapter{Earley items}
\label{ch:earley-items}

\section{Definition}

An Earley item (type \dtype{EIM})
is a triple
\[
    [\Vdr{dotted-rule}, \Vorig{x}, \Vloc{current} ]
\]%
\index{recce-notation}{[3]@[ dr, origin, current ]}%
\index{recce-notation}{[3]@[ dr, origin, current ]!EIM as 3-tuple}
of dotted rule, origin, and current location.

The \dfn{origin} is the location where recognition of the rule
started.
(It is sometimes called the ``parent''.)
The \dfn{current} or \dfn{dot location} is the location
in the input, \Cw{}, of the dot position in \Vdr{dotted-rule}.
For convenience, the type \dtype{ORIG} will be a synonym
for \type{LOC}, indicating that the variable designates
the origin element of an Earley item.
\begin{gather*}
\text{Where $\Veim{x} = [\Vdr{x}, \Vorig{x}, \Vloc{x}]$ we say that} \\
\begin{aligned}
\DR{\Veim{x}} & = \Vdr{x}, \\
\Origin{\Veim{x}} & = \Vorig{x}, \\
\Current{\Veim{x}} & = \Vloc{x}, \\
\Left{\Veim{x}} & = \Vorig{x}, \; \text{and} \\
\Right{\Veim{x}} & = \Vloc{x}. \\
\end{aligned}
\end{gather*}%
\index{recce-notation}{DR(eim)@\DR{eim}}%
\index{recce-notation}{Origin(eim)@\Origin{eim}}%
\index{recce-notation}{Current(eim)@\Current{eim}}%
\index{recce-notation}{Left(eim)@\Left{eim}}%
\index{recce-notation}{Right(eim)@\Right{eim}}

Traditionally, an Earley item is shown as a duple,
\[
    [\Vdr{dotted-rule}, \Vorig{x} ]
\]%
\index{recce-notation}{[2]@[ dr, origin ]}%
\index{recce-notation}{[2]@[ dr, origin ]!EIM as duple}
with \Vloc{current} omitted,
and we will sometimes use this form.
When the duple form is used,
the current location is specified by the context,
either explicitly or implicitly.

\section{Types}

\begin{definition}
\dtitle{Dotted rule notions applied to EIMs}
\label{def:eim-dr-notions}
Whenever we apply a dotted rule notion to an EIM,
we mean to apply that notion to the dotted rule of the EIM.
For example, a
\xdfn{complete EIM}{complete (EIM)!wrt another EIM}
is an EIM with a complete
dotted rule, and a
\xdfn{predicted EIM}{predicted (EIM)}
is an EIM with a predicted dotted rule.
If
\[
  \Veim{quasi} = [ \Vdr{quasi}, \var{i}, \var{j} ]
\]
is a quasi-complete EIM,
then its
\xdfn{completion EIM}{completion EIM!wrt another EIM}
or
\xdfn{completion (EIM)}{completion (EIM)!wrt another EIM}
is
\[
  \big[ [ \Rule{\Veim{quasi}}, \Vsize{\Rule{\Veim{quasi}}} ],
    \var{i}, \var{j}
  \big].
\]
\end{definition}

\begin{definition}
\dtitle{Rule notions applied to EIMs}
\label{def:eim-rule-notions}
Whenever we apply a rule notion to an EIM,
call it \Veim{e},
we mean to apply that notion to
the rule of the dotted rule of the EIM,
or \Rule{\DR{\Veim{e}}}.
\end{definition}

\begin{definition}
\dtitle{Start EIM}
\label{def:start-eim}
The \dfn{start EIM} is
\begin{equation}
\label{eq:def-start-eim-10}
\Veim{start} = [ [\Vsym{accept} \de \mydot \Vsym{start} ], 0, 0 ].
\end{equation}
\end{definition}

\begin{definition}
\dtitle{Accept EIM}
\label{def:accept-eim}
The \dfn{accept EIM} is
\begin{equation}
\label{eq:def-accept-eim-10}
\Veim{accept} = [ [\Vsym{accept} \de \Vsym{start} \mydot ], 0, \Vsize{\Cw} ].
\end{equation}
\end{definition}

\begin{theorem}
\ttitle{Earley item types}
\label{eim-types-correct}
Every EIM falls into one of these
five disjoint types:
start, prediction, read, null-scan and reduction.
\end{theorem}

\begin{proof}
Recall that EIM's take their type from their dotted rule.
The proof then follows directly from definitions
\ref{def:start-dr},
\ref{def:prediction-dr},
\ref{def:null-scan-dr},
\ref{def:read-dr}
and \ref{def:reduction-dr}
above.
\end{proof}

\begin{definition}
\dtitle{Telluric and ethereal EIM's}
\label{def:telluric-eim}
An EIM is
\xdfn{telluric}{telluric!EIM}
if its dotted rule is telluric
and 
\xdfn{ethereal}{ethereal!EIM}
if its dotted rule is ethereal.
\end{definition}

\begin{theorem}
\ttitle{Telluric and ethereal EIM's}
\label{t:telluric-eim}
An EIM is telluric if it is the
start EIM,
a read EIM or a reduction EIM.
An EIM is ethereal if it is a null-scan
EIM or a prediction EIM.
\end{theorem}

\begin{proof}
The theorem follows directly from
\tref{t:telluric-dr} and
\dref[telluric EIM's]{def:telluric-eim}.
\end{proof}

\section{Locsyms}

\begin{definition}
\dtitle{Locsym}
\label{def:locsym}
A
\xdfn{located symbol}{located symbol@located symbol|mysee{locsym}}
or
\qdfn{locsym}
is a duple consisting of a symbol
and a parse location:
\[
< \Vsym{sym}, \Vloc{loc} >.
\]
\end{definition}

\begin{definition}
\dtitle{Locsym of an EIM}
\label{def:eim-locsym}
The
\qdfn{external locsym}%
\index{recce-definitions}{external locsym@external locsym!of an EIM}
of the EIM \Veim{eim}
is
\[
\langle \LHS{\Veim{eim}}, \Left{\Veim{eim}} \rangle.
\]
References to the
\qdfn{locsym}%
\index{recce-definitions}{locsym@locsym!of an EIM}%
\index{recce-definitions}{locsym@locsym|seealso {external locsym}}
of an EIM
are to its external locsym.
We also write the locsym of \Veim{eim} as \LSY{\Veim{eim}}.
\end{definition}

\begin{definition}
\dtitle{Locsym of a parse instance}
\label{def:inst-locsym}
The
\qdfn{locsym}%
\index{recce-definitions}{locsym@locsym!of an INST}
of the parse instance \Vinst{inst}
is
\[
\langle \Symbol{\Vinst{inst}}, \Left{\Vinst{inst}} \rangle.
\]
We also write the locsym of \Vinst{inst} as \LSY{\Vinst{inst}}.
\end{definition}

\begin{definition}
\dtitle{Postdot locsym}
\label{def:postdot-locsym}
The
\qdfn{postdot locsym}%
\index{recce-definitions}{postdot locsym@postdot locsym!of an EIM}
of the EIM \Veim{eim}
is
\[
\langle \Postdot{\Veim{eim}}, \Current{\Veim{eim}} \rangle,
\]
if
\Postdot{\Veim{eim}} is defined.
We also write the postdot locsym of \Veim{eim} as \PLSY{\Veim{eim}}.
If \Postdot{\Veim{eim}} is not defined,
then \PLSY{\Veim{eim}} is undefined.
\end{definition}

\section{Validity}

\begin{definition}
\label{def:eim-valid}
\dtitle{EIM Validity}
We say that
an Earley item
\begin{equation}
\label{eq:def-eim-valid-5}
\bigl[[\Vsym{A} \de \Vstr{predot} \mydot \Vstr{postdot}], \var{i}, \var{j} \bigr]
\end{equation}
is
\xdfn{valid}{valid (EIM)}
if and only if
\begin{equation}
\label{eq:def-eim-valid-10}
\Vsym{A} \derives [\var{i}]\, \Vstr{predot} \,[\var{j}]\, \Vstr{postdot}.
\end{equation}
Note that
\eqref{eq:def-eim-valid-10}
implies that \CW{} is seen as far as \Vloc{j}.
If \Veim{x} is valid, we also say \Valid{\Veim{x}}.
\eqref{eq:def-eim-valid-10}
is called the
\dfn{derivation validity equivalent}
of \eqref{eq:def-eim-valid-5}.
\eqref{eq:def-eim-valid-5}
is called either the
\dfn{parse instance validity equivalent}
or the \dfn{EIM validity equivalent}
of \eqref{eq:def-eim-valid-10}.
When it is clear in context,
we will use a simpler term,
\dfn{validity equivalent}, for
a derivation validity equivalent,
an EIM validity equivalent,
or a parse instance validity equivalent.
\end{definition}

The following definitions will be useful
when relating EIM's to their validity equivalents.
\begin{definition}
\dtitle{EIM validity equivalent}
\label{def:eim-validity-equivalent}
Without loss of generality,
let
\begin{equation}
\label{eq:eim-validity-equivalent-5}
\Veim{eim} = \bigl[[\Vsym{A} \de \Vstr{predot} \mydot \Vstr{postdot}], \var{i}, \var{j} \bigr]
\end{equation}
be an Earley item and
\begin{align}
\label{eq:eim-validity-equivalent-10}
& \Vsym{A} && \text{Step \var{s}} \\
& \quad \derives \; \Vmk{i} \Vstr{predot} \Vmk{j} \Vstr{postdot} \Vmk{k}
&& \text{Step \Vincr{s}}
\end{align}
be its validity equivalent.

Then we say that the derivation step
Step \var{s}
is the
\xdfn{LHS step}{LHS step!wrt an EIM}
of \Veim{eim}.
We say that the derivation step
Step \Vincr{s}
is the
\xdfn{RHS step}{RHS step!wrt an EIM}
of \Veim{eim}.
When we refer to the ``step'' associated with an
EIM without specifying whether LHS or RHS,
we will mean the RHS step.
For example,
when we count derivation steps
between EIM's,
we will regard an EIM
as being located at its RHS step.

We say that
\[
\Vmk{i} \Vsym{A} \Vmk{k}
\]
is the
\xdfn{LHS derivation symbol instance}{LHS derivation symbol instance!wrt an EIM},
or more simply
\xdfn{LHS derivation instance}{LHS derivation instance!wrt an EIM},
of \Veim{eim}.
We say that the derivation symbol instances in
\[
\Vmk{i} \Vstr{predot} \Vstr{postdot} \Vmk{k}
\]
are the
\xdfn{RHS derivation symbol instances}{RHS derivation symbol instances!wrt an EIM},
or more simply
\xdfn{RHS derivation instances}{RHS derivation instances!wrt an EIM},
of \Veim{eim}.
And we say that \Vloc{j} is the
\xdfn{dot location in the derivation}{dot location in the derivation!wrt an EIM},
or when it is clear in context,
the \xdfn{dot location}{dot location!wrt an EIM in a derivation},
of \Veim{eim}.

We will write \Vop{Valid-eq}{x}%
\index{recce-notation}{Valid-eq(x)@\Vop{Valid-eq}{x}}
for the
validity equivalent of \var{x}.
This notation is overloaded ---
\var{x} may be a derivation move or a parse
instance,
and \Vop{Valid-eq}{x} may mean
a derivation validity equivalent,
an EIM validity equivalent,
or a parse instance validity equivalent,
according to its usage in context.
\end{definition}

\begin{definition}
\label{def:4-tuple-eim}
\dtitle{EIM 4-tuple notation}
We will sometimes find it convenient to express EIM's in terms of
derivations,
as 4-tuples:
\begin{equation}
\label{eq:def-4-tuple-eim-10}
\Veim{eim} = \big\langle \var{s}, \var{rha}, \var{rhz}, \var{dotix} \big\rangle
\end{equation}
where \var{s} is the RHS derivation step of \Veim{eim},
the sequence
\[
\drv{d}{\var{s}}{\var{rha} \ldots{} \var{rhz}}
\]
is the RHS of \Veim{eim},
and \var{dotix} is the dot index of \Veim{eim}.

When $\var{dotix} > 0$,
\Veim{eim} expressed in our more usual notation will be
\begin{equation}
\label{eq:def-4-tuple-eim-20}
\Veim{eim} = \big[ [ \Vsym{LH} \de \Vstr{prefix} \mydot \Vstr{suffix} ], \Vloc{i}, \Vloc{j} \big],
\end{equation}
where, in \eqref{eq:def-4-tuple-eim-20},
\begin{align}
\Vstr{prefix} & =
\begin{cases}
\begin{aligned}
& \Symbol{\drv{d}{\var{s}}{\var{rha} \ldots \var{rha}+\Vdecr{dotix}}} \\
& \qquad \text{if $\var{dotix} > 0$,} \\
& \epsilon, \quad \text{otherwise},
\end{aligned}
\end{cases} \\
\Vstr{suffix} & = \Symbol{\drv{d}{\var{s}}{\var{rha}+\var{dotix} \ldots \var{rhz}}}, \\
 \Vloc{i} & = \Left{\drvVV{d}{s}{rha}} \quad \text{and} \\
 \Vloc{j} & = \Left{\drv{d}{\var{s}}{\var{rha}+\var{dotix}}}.
\end{align}
Also, if \var{s} is the first derivation step at which the
symbol instances
\drv{d}{\var{s}}{\var{rha} \ldots{} \var{rhz}}
appear,
so that they are direct descendants of a parent symbol instance
in derivation step \Vdecr{s},
then
\begin{equation}
\Vsym{LH} = \Symbol{\drv{d}{\Vdecr{s}}{\var{rha}}}.
\end{equation}
\end{definition}


\begin{theorem}\label{t:start-eim-is-valid}
\ttitle{Start Earley item is valid}
The start Earley item is valid.
\end{theorem}

\begin{proof}
By the definition of EIM validity,
to show that the start EIM
\eqref{eq:def-start-eim-10}
is valid,
we need to show
that
\begin{equation}
\label{eq:start-eim-is-valid-15}
\Vsym{accept} \derives \mk{0}\; \Vsym{start}.
\end{equation}
By the definition of \Vsym{accept},
it is on the LHS of only one rule,
\eqref{eq:accept-rule-def-10}.
All symbols in \Cg{} are productive,
so that
\begin{equation}
\label{eq:start-eim-is-valid-16}
\Vsym{accept} \derives \Vsym{start} \destar \Vstr{sent}
\end{equation}
where \Vstr{sent} is a sentence.
Since \Vstr{sent} is a sentence,
using \eqref{eq:def-L-g-10},
we have that
\begin{equation*}
\Vstr{sent} \in \myL{\Cg}.
\end{equation*}
Our convention is that \Cw{}
is the input, or sentence, of interest in
context, so here we assume that,
without loss of generality,
\begin{equation}
\label{eq:start-eim-is-valid-18}
\Vstr{sent} = \Cw = \Cw[0, \Vdecr{\Vsize{\Cw}}].
\end{equation}
From
\eqref{eq:start-eim-is-valid-16}
and
\eqref{eq:start-eim-is-valid-18},
we have
\begin{align}
& \Vsym{accept} \derives \Vsym{start} \destar \Cw[0, \Vdecr{\Vsize{\Cw}}] \notag\\
\therefore \quad & \Vsym{accept} \derives \Vsym{start} \destar \mk{0} \; \Cw[0, \Vdecr{\Vsize{\Cw}}] \notag\\
\therefore \quad & \Vsym{accept} \derives \mk{0} \Vsym{start} \destar \mk{0} \; \Cw[0, \Vdecr{\Vsize{\Cw}}] \notag\\
\label{eq:start-eim-is-valid-25}
\therefore \quad & \Vsym{accept} \derives \mk{0} \Vsym{start}
\end{align}
Where
\eqref{eq:start-eim-is-valid-25}
is
\eqref{eq:start-eim-is-valid-15},
which is what we needed to show for the theorem.
\end{proof}

\section{Parse instances}

A \dfn{parse instance} is either a symbol instance or an EIM.
When it is clear in context, we will often say ``symbol''
when we mean ``symbol instance''.
A parse instance is often called simply an \dfn{instance}.

\begin{definition}
\dtitle{Symbolic and EIM equivalent}
\label{def:symbolic-and-eim-equivalent}
If a parse instance is a symbol instance or
a complete EIM,
its ``symbolic equivalent'' is defined.
If the parse instance is a symbol instance,
it is its own \dfn{symbolic equivalent}.
If the parse instance is a complete EIM,
call it \Veim{e},
then its \dfn{symbolic equivalent} is
\begin{gather*}
  \Vmkl{left} \Vsym{sym} \Vmkr{right}, \\
  \begin{aligned}
& \text{where} \; & \Vmk{left} & = \Left{\Veim{e}}, \\
                 && \Vmk{right} & = \Right{\Veim{e}}, \; \text{and} \\
                 && \Vsym{sym} & = \Symbol{\Veim{e}}.
  \end{aligned}
\end{gather*}
We also write the symbolic
equivalent of \var{x} as
$\SymEq{\var{x}}$.%
\index{recce-notation}{SymEq(x)@\SymEq{\var{x}}}
We say that \Veim{eim} is the
\dfn{EIM equivalent}
of \Vinst{x} if and only if
\Vinst{x} is the symbolic equivalent of
\Veim{eim}.
We also write the EIM
equivalent of \Vinst{x} as
$\var{EIM-Eq}(\var{x})$.%
\index{recce-notation}{EIM-Eq(x)@\Vop{EIM-Eq}{x}}
\end{definition}

By way of illustration,
and with full generality, if
a complete EIM is
\begin{equation}
\label{eq:def-symbolic-equivalent-10}
\Veim{up} = \big[
[ \Vsym{up} \de \Vstr{up-rhs} \mydot ], \var{i}, \var{j}
\big],
\end{equation}
then the symbolic equivalent of \Veim{up} is
\begin{equation}
\label{eq:def-symbolic-equivalent-20}
\Vinst{ins} = \Vmkl{i} \Vsym{up} \Vmkr{j}.
\end{equation}

\begin{theorem}
\ttitle{Symbolic equivalent from complete EIM}
\label{t:valid-symbolic-equivalent-from-eim}
A valid, complete EIM has a valid symbolic equivalent,
\Vinst{symeq};
and \Symbol{\Vinst{symeq}} is
a non-terminal.
\end{theorem}

\begin{proof}
Without loss of generality,
let the complete  EIM be
\begin{equation}
\notag
\Veim{up} = \big[
[ \Vsym{up} \de \Vstr{up-rhs} \mydot ], \var{i}, \var{j}
\big].
\end{equation}
\Veim{up} is valid by assumption for the theorem,
so we have the valid derivations,
\begin{alignat}{3}
& \Vsym{up} && \derives
[ \var{i}]\, \Vstr{up-rhs} \,[\var{j}] \\
\therefore \quad
& [\var{i}]\, \Vsym{up} \,[\var{j}] && \derives
[\var{i}]\, \Vstr{up-rhs} \,[\var{j}] \\
\label{eq:valid-symbolic-equivalent-from-eim-20}
\therefore \quad
& [\var{i}]\, \Vsym{up} \,[\var{j}] &&
\end{alignat}
We have shown that
\eqref{eq:valid-symbolic-equivalent-from-eim-20}
is valid.
Let \Vinst{symeq} be
the parse instance of
\eqref{eq:valid-symbolic-equivalent-from-eim-20},
so that
$\Vinst{symeq}
= [\var{i}]\, \Vsym{up} \,[\var{j}].$
From the definition of symbolic equivalent we
see that
\Vinst{symeq}
is the symbolic equivalent of
\Veim{up}.

It remains to show that
\Symbol{\Vinst{symeq}} is a non-terminal.
We note that
$\Symbol{\Vinst{symeq}} = \LHS{\Veim{up}}$,
and with this, we have the theorem.
\end{proof}

\begin{theorem}
\ttitle{EIM equivalent from non-terminal}
\label{t:eim-equivalent-from-non-terminal}
A valid instance, \Vinst{x}, has a valid EIM equivalent if
and only if \Symbol{\Vinst{x}} is a non-terminal.
\end{theorem}

\begin{proof}
We have the ``if'' direction directly from the
definition of validity for non-terminal parse instances.
Theorem~\ref{t:valid-symbolic-equivalent-from-eim}
shows the ``only if'' direction.
\end{proof}

\section{Top-down and bottom-up causes}

We referred to top-down and bottom-up causes earlier,
when introducing dotted rules.
We now revisit these concepts in the context of Earley items.

\begin{definition}
\dtitle{Matching causes}
\label{def:matching-causes}
Let \Veim{down}
be a quasi-incomplete EIM
and let \Vinst{up}
be a symbolic parse instance.
We say that \Veim{down} and \Vinst{up}
are
\qdfn{matching causes}%
\index{recce-definitions}{matching causes|myixentry{\emph{see} match \emph{and} matching}}
if and only if
\begin{gather*}
\PLSY{\Veim{down}} = \LSY{\Vinst{up}}.
\end{gather*}
We say that the duple
\[
    [ \Veim{down}, \Vinst{up} ]
\]
is a \qdfn{cause-pair}.%
\index{recce-definitions}{cause-pair|myixentry{\emph{see} match \emph{and} matching}}

When $[ \Veim{down}, \Vinst{up} ]$ is a cause-pair,
we say that
\Veim{down} and \Vinst{up} \qdfn{match}.%
\index{recce-definitions}{match!between an EIM and an INST}
We call \Veim{down} the
\xdfn{top-down cause}{top-down cause!EIM, in a cause-pair}%
\index{recce-definitions}{matching!EIM, of an INST}
of the cause-pair, and
we call \Vinst{up} the
\xdfn{bottom-up cause}{bottom-up cause!INST, in a cause-pair}%
\index{recce-definitions}{matching!INST, of an EIM}
of the cause-pair.

Let $\var{pair} = [\Veim{down}, \Veim{up}]$
be an ordered pair of EIM's.
We say that
\Veim{down} and \Veim{up}
are \qdfn{matching causes}
if and only if
\Veim{down} and \SymEq{\Veim{up}}
are matching causes.
We call the duple
\[
    [ \Veim{down}, \Veim{up} ]
\]
a \qdfn{cause-pair}.%
\index{recce-definitions}{cause-pair|myixentry{\emph{see} match \emph{and} matching}}
When $[ \Veim{down}, \Veim{up} ]$
is a cause-pair,
we say that
\Veim{down} and \Veim{up} match.%
\index{recce-definitions}{match!between two EIM's}
We call \Veim{down} the
\xdfn{top-down cause}{top-down cause!EIM, in a cause-pair}%
\index{recce-definitions}{matching!EIM, of another EIM}
of \var{pair}, and
we call \Veim{up} the
\xdfn{bottom-up cause}{bottom-up cause!EIM, in a cause-pair}%
\index{recce-definitions}{matching!EIM, of another EIM}
of \var{pair}.

We say that a cause-pair is
\xdfn{valid}{valid!of a cause-pair}
if both its top-down cause
and its bottom-up cause are valid.
\end{definition}

\begin{definition}
\dtitle{Causes of confirmed EIM's}
\label{def:causes-confirmed}
Let
\[
   \var{pair} = [ \Veim{down}, \Vinst{up} ]
\]
be a valid cause-pair.
We say that \Veim{effect} is the
\xdfn{effect}{effect!EIM, as the
   effect of another EIM and an INST}
of \Veim{down} and \Vinst{up}
if and only if these two conditions hold:
\begin{gather*}
\Veim{effect} =
\left[
\begin{gathered}
\Next{\DR{\Veim{down}}}, \\
\Left{\Veim{down}}, \Current{\Vinst{up}}
\end{gathered}
\right]
\; \text{and}
\\
\Predot{\Veim{effect}} = \Symbol{\Vinst{up}}.
\end{gather*}
If and only if \Veim{effect} is the effect 
of \var{pair},
we also say that
\begin{itemize}
\item
\Veim{down} is a
\xdfn{top-down cause}{top-down cause!EIM as top-down cause of a confirmed EIM}
of \Veim{effect}.
\item
\Vinst{up} is a
\xdfn{bottom-up cause}{bottom-up cause!INST as bottom-up cause of a confirmed EIM}
of \Veim{effect}.
\item
if $\SymEq{\Veim{up}} = \Vinst{up}$, that
\Veim{up} is a
\xdfn{bottom-up cause}{bottom-up cause!EIM as bottom-up cause of a confirmed EIM}
of \Veim{effect}.
\end{itemize}
\end{definition}

\begin{definition}
\dtitle{Causes of predicted EIM's}
\label{def:causes-predicted}
If \Veim{effect} is a prediction,
\Vdr{down}
is any top-down dotted rule cause of \DR{\Veim{effect}},
and \Vloc{i} is any location,
we say that every
\begin{gather*}
\Veim{down} = [ \Vdr{down}, \var{i}, \Current{\Veim{effect}} ]
\end{gather*}
is a
\xdfn{top-down cause}{top-down cause!EIM as top-down cause of a predicted EIM}
of \Veim{effect}.
We say that the
\xdfn{bottom-up cause}{bottom-up cause!bottom-up cause of a predicted EIM}
of \Veim{effect} is ethereal.
We call \Veim{effect} the
\xdfn{effect}{effect!predicted EIM, as the effect of another EIM}
of \Veim{down}.
\end{definition}

We say that a bottom-up cause is \dfn{symbolic},
if it has a symbolic equivalent.
The bottom-up causes of predictions
do not have a symbolic equivalent,
and are therefore not symbolic.
All other bottom-up causes are symbolic.

\begin{theorem}
\ttitle{Completed EIM as a cause}
\label{t:completed-eim-as-a-cause}
If a completed EIM is a cause of another EIM,
then it is the bottom-up cause in a pair
of matching causes,
and its effect is
a confirmed EIM.
\end{theorem}

\begin{proof}
Let \Veim{comp} be a completed EIM,
and let \Veim{eff} be its effect.
We proceed by cases.

\textbf{Top-down cause of a prediction}:
If \Veim{eff} has no predot symbol,
then the top-down cause of its dotted
rule is an incomplete dotted rule
\dref[top-down cause of a predicted dotted rule]{def:causes-predicted-dr},
so that the top-down cause of \Veim{eff} must be an incomplete EIM.
\Veim{comp} is, by assumption for the theorem, a complete EIM
so that \Veim{comp} is not the top-down cause of \Veim{eff}.

\textbf{Bottom-up cause of a prediction}:
If \Veim{eff} has no predot symbol,
then its bottom-up cause is ethereal
\dref[causes of a predicted EIM]{def:causes-predicted}.
\Veim{comp} is clearly not ethereal,
so that \Veim{comp} is not the bottom-up cause of \Veim{eff}.

\textbf{Top-down cause of a confirmation}:
If \Veim{eff} has a predot symbol,
its causes are in a pair of matching causes
\dref[causes of a confirmed EIM]{def:causes-confirmed}.
The top-down cause of a pair of matching causes
must be quasi-incomplete
\dref{def:matching-causes}.
By assumption for the theorem,
\Veim{comp} is complete,
so that 
\Veim{comp} is not the top-down cause of \Veim{eff}.

\textbf{Bottom-up cause of a confirmation}:
This is the only remaining case, so that if \Veim{comp}
is a cause of \Veim{eff},
it must fall into this case.
This shows the theorem.
\end{proof}

\begin{theorem}
\ttitle{Incomplete EIM as a cause}
\label{t:incomplete-eim-as-cause}
Assume that
\begin{subequations}
\renewcommand{\theequation}{A\arabic{equation}}
\begin{align}
\label{t:incomplete-eim-as-cause-asm-1}
& \myparbox{%
There exist two valid EIM's,
\Veim{cuz} and \Veim{eff},
such that \Veim{cuz}
is the cause of \Veim{eff}.
} \\
\label{t:incomplete-eim-as-cause-asm-2}
& \myparbox{%
\Veim{cuz} is incomplete.
}
\end{align}
\end{subequations}
Given these assumptions, then
\begin{subequations}
\renewcommand{\theequation}{R\arabic{equation}}
\begin{align}
\label{t:incomplete-eim-as-cause-req-1}
& \myparbox{%
\Veim{cuz} is never the bottom-up cause of any effect.
} \\
\label{t:incomplete-eim-as-cause-req-2}
& \myparbox{%
\Veim{cuz} is a top-down cause of \Veim{eff}.
} \\
\label{t:incomplete-eim-as-cause-req-3a}
& \myparbox{%
If \Veim{eff} is a confirmed EIM,
then it is the effect of the cause-pair
$[ \Veim{cuz}, \Vinst{up} ]$,
where \Vinst{up} is a parse instance.
} \\
\label{t:incomplete-eim-as-cause-req-3b}
& \myparbox{
If \Veim{eff} is a predicted EIM,
then its
top-down cause is \Veim{cuz}
and its bottom-up cause is ethereal.
}
\end{align}
\end{subequations}
\end{theorem}

\begin{proof}
\begin{align}
\label{eq:incomplete-eim-as-cause-10}
& \myparbox{%
If \Veim{eff} is a prediction, its
bottom-up cause is not an EIM
\becuz{}
\dref[causes of a predicted EIM]{def:causes-predicted}.
} \\
\label{eq:incomplete-eim-as-cause-12}
& \myparbox{%
If \Veim{eff} is a prediction,
\Veim{cuz} is not the bottom-up
cause of \Veim{eff}
\becuz{}
\eqref{t:incomplete-eim-as-cause-asm-1},
\eqref{eq:incomplete-eim-as-cause-10}.
} \\
\label{eq:incomplete-eim-as-cause-14}
& \myparbox{%
If \Veim{eff} is confirmed, its
bottom-up cause is a complete EIM.
\becuz{}
\dref[causes of a confirmed EIM]{def:causes-confirmed}.
} \\
\label{eq:incomplete-eim-as-cause-16}
& \myparbox{%
If \Veim{eff} is confirmed, \Veim{cuz}
is not its bottom-up cause.
\becuz{}
\eqref{t:incomplete-eim-as-cause-asm-1},
\eqref{t:incomplete-eim-as-cause-asm-2},
\eqref{eq:incomplete-eim-as-cause-14}.
}
\intertext{%
Since every EIM is either confirmed or
a prediction,
}
\label{eq:incomplete-eim-as-cause-18}
& \myparbox{%
\Veim{cuz}
is never a bottom-up cause.
\becuz{}
\eqref{eq:incomplete-eim-as-cause-12},
\eqref{eq:incomplete-eim-as-cause-16},
which is
Requirement~\eqref{t:incomplete-eim-as-cause-req-1}
of this theorem.
} \\
\label{t:incomplete-eim-as-cause-30}
& \myparbox{%
\Veim{cuz} is a top-down cause of \Veim{eff}
\becuz{}
\eqref{eq:incomplete-eim-as-cause-18},
which is
Requirement~\eqref{t:incomplete-eim-as-cause-req-2}
of this theorem.
} \\
\label{t:incomplete-eim-as-cause-40}
& \myparbox{%
If \Veim{eff} is a confirmed EIM,
then it is the effect of the cause-pair
$[ \Veim{cuz}, \Vinst{up} ]$,
where \Vinst{up} is a parse instance
\becuz{}
\eqref{t:incomplete-eim-as-cause-30},
\dref[causes of a confirmed EIM]{def:causes-confirmed},
which is
Requirement~\eqref{t:incomplete-eim-as-cause-req-3a}
of this theorem.
} \\
\label{t:incomplete-eim-as-cause-50}
& \myparbox{
If \Veim{eff} is a predicted EIM,
then its
top-down cause is \Veim{cuz}
and its bottom-up cause is ethereal
\becuz{}
\eqref{t:incomplete-eim-as-cause-30},
\dref[causes of a predicted EIM]{def:causes-predicted},
which is
Requirement~\eqref{t:incomplete-eim-as-cause-req-3b}
of this theorem. \qedhere
}
\end{align}
\end{proof}

\begin{definition}
\dtitle{Ancestors}
\label{def:ancestor}
%
% TODO: Do I need or use this definition?
%
We say that \Veim{anc} is a \dfn{top-down ancestor}
of \Veim{desc},
if \Veim{anc} is a top-down cause of \Veim{desc},
or if \Veim{anc} is a top-down cause of a top-down ancestor of \Veim{desc}.
If \Veim{anc} is a top-down ancestor of \Veim{desc},
then we say that
\Veim{desc}
is a \dfn{top-down descendant} of \Veim{anc}.
\end{definition}

An effect is always an Earley item.
A top-down cause is always an Earley item.
A bottom-up cause may be ethereal or telluric.

If a bottom-up cause is ethereal, it may be because the effect has no
predot symbol,
or because the bottom-up cause is a nulling terminal symbol instance.
If a bottom-up cause is telluric, it may be because it is
an Earley item,
because it is a non-terminal symbol instance,
or because it is a telluric terminal symbol instance.
Recall that rules in \Marpa{} cannot be
nulling,
and therefore Earley items
and non-terminal symbol instances cannot be nulling.

We have already defined validity for Earley items.
We now extend the concept of validity to other types of
causes.
An ethereal cause is always valid.

\begin{definition}
\dtitle{Validity of terminal symbols}
If \Vsym{T} is a telluric terminal symbol,
and if \CW{} has been seen as far as \Vloc{j},
we say that
\begin{equation}
\label{eq:def-terminal-validity-10}
[\var{i}]\, \Vsym{T} \,[\var{j}]
\end{equation}
is
\xdfn{valid}{valid (terminal symbol)}
if and only if
\begin{equation}
\label{eq:def-terminal-validity-15}
\Vsym{T} = \CVw{i} \; \land \; \var{j} = \var{i} + 1.
\end{equation}
\eqref{eq:def-terminal-validity-10}
is considered to be the
\xdfn{derivation validity equivalent}{derivation validity equivalent (terminal symbol)!wrt itself}
of itself.
When it is clear in context,
we will also call
\eqref{eq:def-terminal-validity-10}
the
\xdfn{validity equivalent}{validity equivalent (terminal symbol)!wrt itself}
of itself.
Overloading our previous use of \myfnname{Valid-eq},
we write \Vop{Valid-eq}{x}%
\index{recce-notation}{Valid-eq(x)@\Vop{Valid-eq}{x}}
for the
validity equivalent
of the terminal symbol instance \Vinst{x}.
\end{definition}

\begin{definition}
\label{def:validity-of-non-terminal}
\dtitle{Validity of non-terminal symbols}
If \Vsym{N} is a non-terminal symbol,
we say that
\begin{equation}
\label{eq:def-non-terminal-validity-10}
\Vinst{N-ins} = [\var{i}]\, \Vsym{N} \,[\var{j}]
\end{equation}
is
\xdfn{valid}{valid (non-terminal symbol)}
if and only if
it is the LHS of a valid, completed EIM.
\Vinst{N-ins} is considered to be the
\xdfn{derivation validity equivalent}{derivation validity equivalent
  (of non-terminal symbol)}
of itself.
When it is clear in context,
we will use the term,
\xdfn{validity equivalent}{validity equivalent},
for the derivation validity equivalent of a
non-terminal symbol.
Also,
overloading our previous use of \myfnname{Valid-eq},
we will write \Vop{Valid-eq}{x}%
\index{recce-notation}{Valid-eq(x)@\Vop{Valid-eq}{x}}
for the validity equivalent
of a non-terminal symbol.
\end{definition}

\section{Confirmed Earley items}

\begin{theorem}
\ttitle{Effect from symbolic cause-pair}
\label{t:effect-from-symbolic-cause-pair}
A cause-pair, both of whose causes are symbolic,
has exactly one valid effect.
\end{theorem}

\begin{proof}
Without loss of generality,
let the top-down cause be
\begin{equation}
\label{eq:effect-from-symbolic-cause-pair-3}
\begin{split}
& \Veim{down} =  \\
& \qquad \qquad [ [ \Vsym{down} \de \Vstr{pre} \mydot \Vsym{A} \cat \Vstr{post} ], \var{i}, \var{j} ],
\end{split}
\end{equation}
and let the symbolic equivalent of the bottom-up cause be
\begin{equation}
\label{eq:effect-from-symbolic-cause-pair-6}
\,[\var{j}]\, \Vsym{A} \,[\var{k}]\, .
\end{equation}
The effect of \Veim{down} and \eqref{eq:effect-from-symbolic-cause-pair-6}
will be
\begin{equation}
\label{eq:effect-from-symbolic-cause-pair-9}
\begin{split}
& \Veim{effect} =  \\
& \qquad \qquad [ [ \Vsym{down} \de \Vstr{pre} \cat \Vsym{A} \mydot \Vstr{post} ], \var{i}, \var{k} ].
\end{split}
\end{equation}
\Veim{effect} is fully determined by
\Veim{down} and \eqref{eq:effect-from-symbolic-cause-pair-6}
and is therefore unique.

It remains to show that \Veim{effect}
is valid.
By the definition of validity for an Earley item,
we will have shown this if we can show that
\begin{equation}
\label{eq:effect-from-symbolic-cause-pair-12}
\Vsym{down} \derives [\var{i}]\, \Vstr{pre} \cat \Vsym{A} \,[\var{k}]\, \Vstr{post}.
\end{equation}

By assumption,
\eqref{eq:effect-from-symbolic-cause-pair-3}
is valid.
From the definition of validity for an Earley item:
\begin{equation}
\label{eq:effect-from-symbolic-cause-pair-20}
\Vsym{down} \derives [\var{i}]\, \Vstr{pre} \,[\var{j}]\, \Vsym{A} \cat \Vstr{post}
\end{equation}

We see that the location markers in
\eqref{eq:effect-from-symbolic-cause-pair-6}
and
\eqref{eq:effect-from-symbolic-cause-pair-20}
are compatible:
\var{i} and \var{k} are unrestricted,
while the use of \var{j} in both derivations is compatible.
Composing them we have
\begin{alignat}{2}
\label{eq:effect-from-symbolic-cause-pair-25}
& \Vsym{down} \derives [\var{i}]\, \Vstr{pre} \,[\var{j}]\, \Vsym{A} \,[\var{k}]\, \Vstr{post} \\
\therefore \quad & \Vsym{down} \derives [\var{i}]\, \Vstr{pre} \cat \Vsym{A} \,[\var{k}]\, \Vstr{post}
\label{eq:effect-from-symbolic-cause-pair-28}
\end{alignat}
Where
\eqref{eq:effect-from-symbolic-cause-pair-28}
is
\eqref{eq:effect-from-symbolic-cause-pair-12},
which is what we needed to show for the theorem.
\end{proof}

\begin{theorem}
\ttitle{Null-scan from top-down cause}
\label{t:null-scan-from-down-cause}
Let
\[
[ \Vsym{A} \de \Vstr{prf} \Vsym{nul} \Vstr{suf} ]
\]
be a rule in \Cg{}
such that
$\Vsym{nul} = \epsilon$.
Then, for some \Vloc{i}, \Vloc{k},
\begin{equation}
\label{eq:null-scan-from-down-cause-5}
\Veim{down} = \big[ [ \Vsym{A} \de \Vstr{prf} \mydot \Vsym{nul} \Vstr{suf} ],
\var{i}, \var{k} \big]
\end{equation}
is valid
if and only if
\begin{equation}
\label{eq:null-scan-from-down-cause-8}
\Veim{eff} = \big[ [ \Vsym{A} \de \Vstr{prf} \Vsym{nul} \mydot \Vstr{suf} ],
\var{i}, \var{k} \big]
\end{equation}
is valid.
Also,
\Veim{down} is the unique valid top-down cause of \Veim{eff};
and
\Veim{eff} is the unique valid effect of \Veim{down}.
\end{theorem}

\begin{proof}
To show the ``if'' direction, we assume
\eqref{eq:null-scan-from-down-cause-8}.
Using the definition of EIM validity
and
\eqref{eq:null-scan-from-down-cause-8},
we see that
\begin{equation}
\label{eq:null-scan-from-down-cause-20}
\Vsym{A} \derives \Vmk{i} \Vstr{prf} \Vsym{nul} \Vmk{k} \Vstr{suf}.
\end{equation}
Moving \Vmk{k} in
\eqref{eq:null-scan-from-down-cause-20}
to the other side of the nulling symbol produces
\begin{equation}
\label{eq:null-scan-from-down-cause-23}
\Vsym{A} \derives \Vmk{i} \Vstr{prf} \Vmk{k} \Vsym{nul} \Vstr{suf}.
\end{equation}
\eqref{eq:null-scan-from-down-cause-5}
follows from
\eqref{eq:null-scan-from-down-cause-23},
by EIM validity.

The proof of the ``only if'' direction is symmetric.
\Veim{down} is valid by assumption, so
from
\eqref{eq:null-scan-from-down-cause-5}
we have
\begin{equation}
\label{eq:null-scan-from-down-cause-30}
\Vsym{A} \derives \Vmk{i} \Vstr{prf} \Vmk{k} \Vsym{nul} \Vstr{suf}.
\end{equation}
Moving \Vmk{k} in
\eqref{eq:null-scan-from-down-cause-30}
to the other side of the nulling symbol produces
\begin{equation}
\label{eq:null-scan-from-down-cause-33}
\Vsym{A} \derives \Vmk{i} \Vstr{prf} \Vsym{nul} \Vmk{k} \Vstr{suf}.
\end{equation}
\eqref{eq:null-scan-from-down-cause-8}
follows from
\eqref{eq:null-scan-from-down-cause-33}
by EIM validity.

By the definition of top-down cause applied to a null-scan,
we see that,
if \Veim{cuz} is a valid top-down cause of
a null-scan effect,
then that effect must be
\begin{equation}
\notag
\label{eq:null-scan-from-down-cause-40}
     \Veim{eff} =
\left[
\begin{gathered}
\Next{\DR{\Veim{cuz}}}, \\
\Left{\Veim{cuz}}, \Current{\Veim{cuz}}
\end{gathered}
\right],
\end{equation}
so that \Veim{eff} is a function of \Veim{cuz}
and therefore unique.

Again considering
the definition of top-down causes as applied to null-scans,
we see that
if \Veim{eff} is a valid null-scanned effect,
then its top-down cause must be
\begin{equation}
\notag
\label{eq:null-scan-from-down-cause-45}
     \Veim{cuz} =
\left[
\begin{gathered}
\Prev{\DR{\Veim{eff}}}, \\
\Left{\Veim{eff}}, \Current{\Veim{eff}}
\end{gathered}
\right],
\end{equation}
so that \Veim{cuz} is a function of \Veim{eff}
and therefore unique.
\end{proof}

\begin{theorem}
\ttitle{Confirmation from bottom-up cause}
\label{t:confirmation-from-up-cause}
Let \Veim{eff} be an EIM.
If the bottom-up cause of \Veim{eff} is a non-nulling
terminal or an EIM,
then \Veim{eff} is a confirmation.
\end{theorem}

\begin{proof}
This theorem follows directly from
\tref{t:completed-eim-as-a-cause}.
\end{proof}

\begin{theorem}
\ttitle{Causes of confirmed effect}
\label{t:symbolic-causes-from-effect}
If
\[\Veim{effect} = [ \Vdr{effect}, \var{i}, \var{k} ],\]
is a valid, confirmed EIM,
then
\begin{subequations}
\renewcommand{\theequation}{R\arabic{equation}}
\begin{align}
\label{eq:symbolic-causes-from-effect-3}
& \myparbox{%
\Veim{effect} must have a valid symbolic bottom-up cause,
call it $\Vinst{up}$.
} \\
\label{eq:symbolic-causes-from-effect-6}
& \myparbox{%
\Veim{effect} must have a valid top-down cause,
call it $\Veim{down}$.
} \\
\label{eq:symbolic-causes-from-effect-9}
& \myparbox{%
\Vinst{up} and \Veim{down} must be matching causes.
}
\intertext{%
And, for every matching pair of causes,
where we call the top-down cause \Veim{down},
and we call the bottom-up cause \Vinst{up},
}
\label{eq:symbolic-causes-from-effect-12}
& \myparbox{%
$\Right{\Vinst{up}}  = \Vloc{k}$.
} \\
\label{eq:symbolic-causes-from-effect-15}
& \myparbox{%
$\Left{\Veim{down}} = \Vloc{i}$.
} \\
\label{eq:symbolic-causes-from-effect-18}
& \myparbox{%
$\Symbol{\Vinst{up}} = \Predot{\Veim{effect}}$.
} \\
\label{eq:symbolic-causes-from-effect-19}
& \myparbox{%
$\Predot{\Veim{effect}} = \Postdot{\Veim{down}}$.
} \\
\label{eq:symbolic-causes-from-effect-21}
& \myparbox{%
$\Next{\Vdr{down}} = \Vdr{effect}$.
}
\end{align}
\end{subequations}
\end{theorem}

\begin{proof}
Without loss of generality,
let \Veim{effect} be
\begin{equation}
\label{eq:symbolic-causes-from-effect-20}
\Veim{effect} =
\big[ [ \Vsym{down} \de \Vstr{pre} \cat \Vsym{A} \mydot \Vstr{post} ], \var{i}, \var{k}
\big].
\end{equation}
By
\dref[causes of a confirmed EIM]{def:causes-confirmed},
the bottom-up cause of \Veim{effect} is
\begin{equation}
\label{eq:symbolic-causes-from-effect-25}
\Vinst{up} = \Vmkl{j} \Vstr{A} \Vmkr{k},
\end{equation}
and the top-down cause is
\begin{equation}
\label{eq:symbolic-causes-from-effect-30}
\Veim{down} = [ [ \Vsym{down} \de \Vstr{pre} \mydot \Vsym{A} \cat \Vstr{post} ], \var{i}, \var{j} ].
\end{equation}
The statement of \Vinst{up} and \Veim{down} in
\eqref{eq:symbolic-causes-from-effect-25} and
\eqref{eq:symbolic-causes-from-effect-30}
is without loss of generality.

Trivially, we can see that
\eqref{eq:symbolic-causes-from-effect-20},
\eqref{eq:symbolic-causes-from-effect-25},
and
\eqref{eq:symbolic-causes-from-effect-30}
satisfy
Requirements~\eqref{eq:symbolic-causes-from-effect-9},
\eqref{eq:symbolic-causes-from-effect-12},
\eqref{eq:symbolic-causes-from-effect-15},
\eqref{eq:symbolic-causes-from-effect-18},
\eqref{eq:symbolic-causes-from-effect-19}
and
\eqref{eq:symbolic-causes-from-effect-21}
in the statement of the theorem.
It remains to show that
\eqref{eq:symbolic-causes-from-effect-25},
and
\eqref{eq:symbolic-causes-from-effect-30}
are valid.

Using
\eqref{eq:symbolic-causes-from-effect-20},
and the definition of location markers,
we have
\begin{equation}
\label{eq:symbolic-causes-from-effect-29}
\Vstr{pre} \cat \Vstr{A} \destar \var{w}[\var{i}, (\var{k} \subtract 1)],
\end{equation}
so that there must be some \Vloc{j}, $\var{i} \le \var{j} \le \var{k}$,
such that
\begin{equation}
\label{eq:symbolic-causes-from-effect-32}
\Vsym{down} \derives \Vmkl{i} \Vstr{pre} \Vmkm{j} \Vstr{A} \Vmkm{k} \Vstr{post}.
\end{equation}
Simplifying
\eqref{eq:symbolic-causes-from-effect-32},
we have
\eqref{eq:symbolic-causes-from-effect-25},
our bottom-up cause.
This shows that \Vinst{up} is valid
which was Requirement~\eqref{eq:symbolic-causes-from-effect-3}
in the statement of this theorem.

A different simplification of
\eqref{eq:symbolic-causes-from-effect-32}
produces
\begin{equation}
\label{eq:symbolic-causes-from-effect-38}
\Vsym{down} \derives \Vmkl{i} \Vstr{pre} \Vmkm{j} \Vstr{A} \cat \Vstr{post},
\end{equation}
and
from
\eqref{eq:symbolic-causes-from-effect-38},
by the definition of EIM validity,
we have
\eqref{eq:symbolic-causes-from-effect-30}.
This shows that \Veim{down} is valid
which was
Requirement~\eqref{eq:symbolic-causes-from-effect-6},
the only remaining requirement
in the statement of this theorem.
\end{proof}

\begin{theorem}
\ttitle{Top-down cause of confirmed effect}
\label{t:down-cause-from-effect}
Let
\begin{equation*}
\Veim{effect} = [ \Vdr{effect}, \var{i}, \var{k} ]
\end{equation*}
be a valid, confirmed EIM.
Then \Veim{effect} has a valid top-down cause, \Veim{down},
such that
\begin{align}
\label{eq:down-cause-from-effect-10}
\Veim{down} & = \big[ \Prev{\Vdr{effect}}, \var{i}, \var{k} \big] \\
& \qquad \text{if \Veim{effect} is a null-scan EIM,} \notag\\
\label{eq:down-cause-from-effect-13}
\Veim{down} & = \big[ \Prev{\Vdr{effect}}, \var{i}, \Vdecr{k} \big] \\
& \qquad \text{if \Veim{effect} is a read EIM, and} \notag\\
\label{eq:down-cause-from-effect-16}
\Veim{down} & = \big[ \Prev{\Vdr{effect}}, \var{i}, \var{j} \big] \\
& \qquad \text{where $\var{j} < \var{k}$, if \Veim{effect} is a telluric EIM.} \notag
\end{align}
\end{theorem}

\begin{proof}
The proof follows from
Theorem \ref{t:symbolic-causes-from-effect},
noting in particular the requirement that
\Veim{effect} must have
a top-down cause, \Veim{down},
and a bottom-up cause, \Vinst{up},
and that they must match.
By the definition of matching causes,
\begin{equation}
\label{eq:down-cause-from-effect-20}
\Right{\Veim{down}} = \Left{\Vinst{up}}.
\end{equation}
By the definition of left and right location,
\begin{equation}
\label{eq:down-cause-from-effect-23}
\Right{\Vinst{up}} = \Left{\Vinst{up}} + \Vsize{\Vinst{up}}.
\end{equation}
Using
Theorem \ref{t:symbolic-causes-from-effect},
\begin{equation}
\label{eq:down-cause-from-effect-26}
\Right{\Vinst{up}} = \Right{\Veim{effect}} = \Vloc{k}.
\end{equation}

Combining
\eqref{eq:down-cause-from-effect-20},
\eqref{eq:down-cause-from-effect-23} and
\eqref{eq:down-cause-from-effect-26},
we have
\begin{equation}
\label{eq:down-cause-from-effect-29}
\begin{aligned}
\Right{\Veim{down}} & = \Right{\Veim{effect}} \subtract \Vsize{\Vinst{up}} \\
& = \Vloc{k} \subtract \Vsize{\Vinst{up}}.
\end{aligned}
\end{equation}

If \Veim{effect} is a null-scan, then
\Vinst{up} is a nulling symbol instance,
and
$\Vsize{\Vinst{up}} = 0$,
so that we have
\eqref{eq:down-cause-from-effect-10}.

If \Veim{effect} is a read EIM, then
\Vinst{up} is a non-nulling terminal symbol instance,
and
$\Vsize{\Vinst{up}} = 1$,
so that we have
\eqref{eq:down-cause-from-effect-13}.

If \Veim{effect} is telluric, then
\Vinst{up} is a telluric symbol instance,
and
$\Vsize{\Vinst{up}} \ge 1$,
so that we have
\eqref{eq:down-cause-from-effect-16}.
\end{proof}

\begin{sloppypar}
\begin{FlushLeft}
\begin{theorem}
\ttitle{Effect from symbol instance}
\label{t:effect-from-symbol}
Let
\begin{equation}
\label{eq:effect-from-symbol-0}
\var{Ai} = \Vmkm{j} \Vsym{A} \Vmkm{k}
\end{equation}
be a valid symbol instance.
If $\Vsym{A} \neq \Vsym{accept}$
then we have the following:
\begin{enumerate}
\item
\label{req:effect-from-symbol-1}
\var{Ai} is the bottom-up cause of at least one valid effect.
\item
\label{req:effect-from-symbol-2}
\var{Ai} has at least one matching valid top-down cause.
\item
\label{req:effect-from-symbol-3}
If \Veim{down} is a top-down cause of \Vinst{Ai} then
$\Right{\Veim{down}} = \Left{\Vinst{Ai}}$.
\item
\label{req:effect-from-symbol-4a}
If \Veim{down} is a top-down cause of \Vinst{Ai} then
$\Vsym{A} = \Postdot{\Veim{down}}.$
\item
\label{req:effect-from-symbol-4b}
If \Veim{effect} is an effect of \Vinst{Ai} then
$\Vsym{A} = \Predot{\Veim{effect}}.$
\item
\label{req:effect-from-symbol-5}
If \Veim{down} is a top-down cause of \Vinst{Ai} then
$\PLSY{\Veim{down}} = \LSY{\Vinst{Ai}}.$
\end{enumerate}
\end{theorem}

\end{FlushLeft}
\end{sloppypar}

\begin{proof}
By assumption for the theorem,
$\Vsym{A} \neq \Vsym{accept}$.
Therefore,
there is at least one derivation step before
\eqref{eq:effect-from-symbol-0},
so that, without loss of generality, we may write
\begin{equation}
\label{eq:effect-from-symbol-9}
\Vsym{down} \destar \Vstr{pre} \Vmkm{j} \Vsym{A} \Vmkm{k} \Vstr{post}.
\end{equation}
If we let $\Vloc{i} = \Left{\Vstr{pre}}$,
and introduce a location marker for it into
\eqref{eq:effect-from-symbol-9},
we have
\begin{equation}
\label{eq:effect-from-symbol-25}
\Vsym{down} \derives \Vmkm{i} \Vstr{pre} \Vmkm{j} \Vsym{A} \Vmkm{k} \Vstr{post}.
\end{equation}
From
\eqref{eq:effect-from-symbol-25},
and the definition of validity for an Earley item,
we know that
\begin{gather}
\label{eq:effect-from-symbol-28}
\begin{gathered}
\Veim{down} =
[ [ \Vsym{down} \de \Vstr{pre} \mydot \Vsym{A} \cat \Vstr{post} ], \var{i}, \var{j} ] \\
\text{is valid; and}
\end{gathered}
\\
\label{eq:effect-from-symbol-29}
\begin{gathered}
\Veim{effect} =
[ [ \Vsym{down} \de \Vstr{pre} \cat \Vsym{A} \mydot \Vstr{post} ], \var{i}, \var{k} ]
\\
\text{is valid and confirmed.}
\end{gathered}
\end{gather}

From
\eqref{eq:effect-from-symbol-29}
and \dref[causes of confirmed EIM]{def:causes-confirmed},
we have Requirement
\ref{req:effect-from-symbol-1} of this theorem.
From
\eqref{eq:effect-from-symbol-28},
\eqref{eq:effect-from-symbol-29},
and \dref[causes of confirmed EIM]{def:causes-confirmed}
we have Requirement
\ref{req:effect-from-symbol-2} of this theorem.
\eqref{eq:effect-from-symbol-28} shows
Requirement~\ref{req:effect-from-symbol-3}.
Requirement~\ref{req:effect-from-symbol-4a}
follows from \eqref{eq:effect-from-symbol-28}.
Requirement~\ref{req:effect-from-symbol-4b}
follows from \eqref{eq:effect-from-symbol-29}.

To show
Requirement~\ref{req:effect-from-symbol-5}:
\begin{align}
\label{eq:effect-from-symbol-35}
& \Symbol{\Vinst{Ai}} = \Vsym{A} \becuz
\eqref{eq:effect-from-symbol-0}.
\\
\label{eq:effect-from-symbol-37}
& \Left{\Vinst{Ai}} = \Vloc{j} \becuz
\eqref{eq:effect-from-symbol-0}.
\\
\label{eq:effect-from-symbol-39}
& \LSY{\Vinst{Ai}} = [ \Vsym{A}, \Vloc{j} ] \becuz 
\eqref{eq:effect-from-symbol-35},
\eqref{eq:effect-from-symbol-37}.
\\
\label{eq:effect-from-symbol-42}
& \begin{aligned}
& \PLSY{\Veim{down}} = 
\left[
\begin{gathered}
\Postdot{\Veim{down}}, \\
\Current{\Veim{down}}
\end{gathered}
\right]
\\
& \qquad \qquad \becuz{} \dref[postdot locsym of an EIM]{def:postdot-locsym}.
\end{aligned}
\\
\label{eq:effect-from-symbol-44}
& \myparbox{%
\PLSY{\Veim{down}} = [ \Vsym{A}, \Vloc{j} ] \becuz{}
\eqref{eq:effect-from-symbol-28}.
}
\end{align}
Requirement~\ref{req:effect-from-symbol-5}
follows from
\eqref{eq:effect-from-symbol-39}
and
\eqref{eq:effect-from-symbol-44}.
\end{proof}

\begin{theorem}
\ttitle{Terminal bottom-up causes are unique}
\label{t:terminal-cause-unique}
Let an instance of the terminal
\Vsym{term} be the bottom-up cause of an effect,
\Veim{effect}.
Then that instance is the only
bottom-up cause of \Veim{effect}.
\end{theorem}

\begin{proof}
Since \Vsym{term} is a terminal
it cannot appear on the LHS of a rule.
Since \Vsym{term} cannot be the LHS of a rule,
by Theorem
\ref{t:eim-equivalent-from-non-terminal},
an instance of \Vsym{term} has no EIM equivalent.
Let the instance of \Vsym{term} that is a bottom-up cause of \Veim{effect} be
\begin{equation}
\Vinst{inst1} = \Vmkm{l1} \Vsym{term} \Vmkm{r1}.
\end{equation}
Assume for a reductio that
\Vinst{inst2} is another
symbolic bottom-up cause of \Veim{effect},
\begin{gather}
\Vinst{inst2} = \Vmkm{l2} \Vsym{sym2} \Vmkm{r2} \\
\label{eq:terminal-cause-unique-5}
\text{where $\var{l1} \neq \var{l2}$ or $\Vsym{term} \neq \Vsym{sym2}$ or $\var{r1} \neq \var{r2}.$}
\end{gather}

But by Theorem \ref{t:symbolic-causes-from-effect},
the bottom-up cause symbol of \Veim{effect} must be
\Predot{\Veim{effect}},
so that
\begin{equation}
\label{eq:terminal-cause-unique-10}
\Vsym{term} = \Predot{\Veim{effect}} = \Vsym{sym2}.
\end{equation}

Also by Theorem \ref{t:symbolic-causes-from-effect},
the right location of its bottom-up cause must be
\Right{\Veim{effect}}, so that
\begin{equation}
\label{eq:terminal-cause-unique-20}
\var{r1} = \Right{\Veim{effect}} = \var{r2}.
\end{equation}

Finally,
if \Vsym{term} is terminal,
it must be telluric in which case its length is 1,
or nulling, in which case its length is 0.
In either case its length is fixed.
Let $\Vsize{\Vsym{term}} = \var{len}$.
Then
\begin{equation}
\label{eq:terminal-cause-unique-30}
\var{l1} \; = \; \left(\Right{\Veim{effect}} \subtract \var{len}\right) \; = \; \var{l2}.
\end{equation}

Gathering
\eqref{eq:terminal-cause-unique-10},
\eqref{eq:terminal-cause-unique-20}
and
\eqref{eq:terminal-cause-unique-30},
we see that
\eqref{eq:terminal-cause-unique-5} is false,
which is contrary to the assumption for the reductio.
So \Vinst{inst1} must be unique.
Our choice of \Vinst{inst1} was without loss of generality,
so this shows the theorem.
\end{proof}

\section{Predictions}

\begin{theorem}
\ttitle{Prediction from top-down cause}
\label{t:prediction-from-cause}
Let
\begin{equation}
\label{eq:prediction-from-cause-3}
\Veim{down} = \big[
  [ \Vsym{down} \de \Vstr{pre} \mydot \Vsym{A} \cat \Vstr{post} ], \var{i}, \var{j}
\big]
\end{equation}
be a valid EIM,
and let
\begin{equation}
\label{eq:prediction-from-cause-6}
[ \Vsym{A} \de \Vstr{A-rhs} ]
\end{equation}
be a rule in \Cg{}.
Then
\begin{equation}
\label{eq:prediction-from-cause-9}
\Veim{prediction} = \big[ [ \Vsym{A} \de \mydot \Vstr{A-rhs} ], \var{j}, \var{j}
\big]
\end{equation}
is valid.
\end{theorem}

\begin{proof}
By assumption,
\eqref{eq:prediction-from-cause-3}
is valid.
From the definition of validity for an Earley item:
\begin{equation}
\label{eq:prediction-from-cause-20}
\Vsym{down} \derives [\var{i}]\, \Vstr{pre} \,[\var{j}]\, \Vsym{A} \cat \Vstr{post}
\end{equation}
Using
\eqref{eq:prediction-from-cause-6}
and
\eqref{eq:prediction-from-cause-20},
and expanding \Vsym{A} into its
direct descendants,
we have
\begin{equation}
\label{eq:prediction-from-cause-25}
\begin{split}
\Vsym{down} \; & \derives \; \Vmk{i} \Vstr{pre} \Vmk{j} \Vsym{A} \Vstr{post} \\
    & \derives \; \Vmk{i} \Vstr{pre} \Vmk{j} \Vstr{A-rhs} \Vstr{post}.
\end{split}
\end{equation}

Simplifying
\eqref{eq:prediction-from-cause-25},
we have
\begin{equation}
\label{eq:prediction-from-cause-12}
\Vsym{A} \derives [\var{j}] \Vstr{A-rhs}.
\end{equation}
By the definition of validity for an Earley item,
this shows
\eqref{eq:prediction-from-cause-9},
and therefore the theorem.
\end{proof}

\begin{theorem}
\ttitle{Top-down cause from prediction}
\label{t:cause-from-prediction}
Let
\begin{equation}
\label{eq:cause-from-prediction-1}
\Veim{prediction} = \big[ [ \Vsym{A} \de \mydot \Vstr{A-rhs} ], \var{j}, \var{j}
\big]
\end{equation}
be a predicted EIM.
Then there is a rule,
\begin{equation}
\label{eq:cause-from-prediction-2}
  [ \Vsym{down} \de \Vstr{pre} \Vsym{A} \Vstr{post} ] \in \Crules
\end{equation}
and some \Vloc{i},
some \Vstr{pre}, and
some \Vstr{post}
such that
\begin{equation}
\label{eq:cause-from-prediction-3}
\Veim{down} = \big[
  [ \Vsym{down} \de \Vstr{pre} \mydot \Vsym{A} \cat \Vstr{post} ], \var{i}, \var{j}
\big]
\end{equation}
is valid.
\end{theorem}

\begin{proof}
Since
\eqref{eq:cause-from-prediction-1} is valid,
we have
\begin{equation}
\label{eq:cause-from-prediction-12}
\Vsym{A} \derives [\var{j}] \Vstr{A-rhs}.
\end{equation}
All symbols in Marpa grammars are accessible
and,
because
\eqref{eq:cause-from-prediction-1} is a prediction,
and therefore not the start EIM,
\Vsym{A} is not \Vsym{accept}.
So we can expand
\eqref{eq:cause-from-prediction-12}
to
\begin{equation}
\label{eq:cause-from-prediction-25}
\begin{split}
\Vsym{accept} \; & \destar \; \Vstr{pre2} \Vsym{down} \Vstr{post2} \\
    & \derives \; \Vstr{pre2} \Vstr{pre} \Vmk{j} \Vsym{A} \Vstr{post} \Vstr{post2} \\
    & \derives \; \Vstr{pre2} \Vstr{pre} \Vmk{j} \Vstr{A-rhs} \Vstr{post} \Vstr{post2}.
\end{split}
\end{equation}
which simplifies to
\begin{equation}
\label{eq:cause-from-prediction-30}
\Vsym{down} \derives \Vmk{i} \Vstr{pre} \Vmk{j} \Vsym{A} \Vstr{post},
\end{equation}
into which we have introduced a location
marker for \Vloc{i}.
From \eqref{eq:cause-from-prediction-30},
by the definition of EIM validity,
we have
\eqref{eq:cause-from-prediction-3}.
\eqref{eq:cause-from-prediction-3},
in turn,
shows
\eqref{eq:cause-from-prediction-2}
and the theorem.
\end{proof}

\section{Ethereal closure}

\begin{definition}
\dtitle{Ethereal closure operations}
\label{def:ethereal-closure-operations}
In the following definitions,
$\langle \Veim{down}, \Veim{effect} \rangle$
is a duple,
where \Veim{down} is a top-down cause
of \Veim{effect}:
\begin{align}
\label{def:predict-op}
\index{recce-definitions}{predict-op}
\index{recce-notation}{predict-op@\op{predict-op}{\var{eim1}, \var{eim2}}}
& \var{predict-op} \defined \left\lbrace
  \begin{gathered}
  \langle \var{down}, \var{effect} \rangle \; \text{such that}
  \\
  \text{\var{effect} is a prediction}
  \end{gathered}
\; \right\rbrace ,
\\
\label{def:null-scan-op}
\index{recce-definitions}{null-scan-op}
\index{recce-notation}{null-scan-op@\op{null-scan-op}{\var{eim1}, \var{eim2}}!as a relation}
& \var{null-scan-op} \defined \left\lbrace
  \begin{gathered}
  \langle \var{down}, \var{effect} \rangle \; \text{such that}
  \\
  \text{\var{effect} is a null-scan}
  \end{gathered}
\; \right\rbrace ,
\\
\label{def:read-op}
\index{recce-definitions}{read-op}
\index{recce-notation}{read-op@\op{read-op}{\var{eim1}, \var{eim2}}}
& \var{read-op} \defined \left\lbrace
  \begin{gathered}
  \langle \var{down}, \var{effect} \rangle \; \text{such that}
  \\
  \text{\var{effect} is a read}
  \end{gathered}
\; \right\rbrace ,
\\
\label{def:reduction-op}
\index{recce-definitions}{reduction-op}
\index{recce-notation}{reduction-op@\op{reduction-op}{\var{eim1}, \var{eim2}}}
& \var{reduction-op} \defined \left\lbrace
  \begin{gathered}
  \langle \var{down}, \var{effect} \rangle \; \text{such that}
  \\
  \text{\var{effect} is a reduction}
  \end{gathered}
\; \right\rbrace ,
\\
\label{def:epsilon-op}
\index{recce-definitions}{epsilon-op}
\index{recce-notation}{epsilon-op@\op{epsilon-op}{\var{eim1}, \var{eim2}}}
& \var{epsilon-op} \defined \var{predict-op} \cup \var{null-scan-op},
\\
\label{def:fleeting-closure}
\index{recce-definitions}{fleeting-closure}
\index{recce-notation}{fleeting-closure@\op{fleeting-closure}{\var{eim}}}
& \var{fleeting-closure} \defined \var{null-scan-op}^\ast
\; \text{and}
\\
\label{def:ethereal-closure}
\index{recce-definitions}{ethereal-closure}
\index{recce-notation}{ethereal-closure@\op{ethereal-closure}{\var{eim}}}
& \var{ethereal-closure} \defined \var{epsilon-op}^\ast.
\end{align}
\end{definition}

\begin{sloppypar}
\begin{FlushLeft}
\begin{theorem}
\ttitle{Ethereal closure properties}
\label{t:ethereal-closure}
Let \Veim{base} be a valid
EIM such that
\begin{equation}
\Veim{desc} \in \var{ethereal-closure}(\Veim{base}).
\end{equation}
Then
\begin{enumerate}
\item
\label{req:ethereal-closure-3}
$\Valid{\Veim{desc}}$
\item
\label{req:ethereal-closure-5}
$\DR{\Veim{desc}} \in \var{ethereal-dr-closure}(\DR{\Veim{base}})$,
\item
\label{req:ethereal-closure-8}
$\Current{\Veim{desc}} = \Current{\Veim{base}},$
\item
\label{req:ethereal-closure-12}
if \Veim{desc} is a quasi-prediction,
$\Left{\Veim{desc}} = \Current{\Veim{base}}$,
and
\item
\label{req:ethereal-closure-15}
if \Veim{desc} is quasi-confirmed,
then
$\Left{\Veim{desc}} = \Left{\Veim{base}}.$
\end{enumerate}
\end{theorem}
\end{FlushLeft}
\end{sloppypar}

\begin{proof}
Our proof will be by induction on the iterations
of
\var{epsilon-op}.
Let
\begin{equation}
\var{eims}[\var{i}] = \var{epsilon-op}^{\displaystyle \var{i}}(\Veim{base}).
\end{equation}

We take as our induction hypothesis:
\begin{equation}
\label{eq:ethereal-closure-18}
\myparbox{
The EIM's in $\var{eims}[\var{x}]$
obey Requirements
\ref{req:ethereal-closure-3},
\ref{req:ethereal-closure-5},
\ref{req:ethereal-closure-8},
\ref{req:ethereal-closure-12}
and
\ref{req:ethereal-closure-15}
in the statement of the theorem.
}
\end{equation}

Recall that
when we apply dotted rule notions
and functions to
an EIM, we refer to its dotted rule.
By the definition of a quasi-prediction
and of \myfnname{Dotix},
\begin{equation}
\label{eq:ethereal-closure-20}
\begin{gathered}
\text{if \Veim{qpred} is a quasi-prediction, then} \\
\var{i} < \op{Dotix}{\Veim{qpred}} \implies \RHS{\Veim{qpred}, \var{i}} \derives \epsilon \quad \text{and} \\
\text{\Current{\Veim{qpred}} = \Left{\Veim{qpred}}}.
\end{gathered}
\end{equation}

\textbf{Basis}:
As the basis of the induction, we show
\eqref{eq:ethereal-closure-18}
for $\var{x} = 0$.
By the definition of an ethereal closure,
$\var{eims}[0] = \lbrace \Veim{base} \rbrace.$
By assumption for the theorem, \Veim{base} is valid.
This shows Requirement~\ref{req:ethereal-closure-3}.
Trivially, \DR{\Veim{base}} is in its own ethereal closure.
This shows Requirement~\ref{req:ethereal-closure-5}.
Also trivially, its current location is self-identical,
which shows Requirement~\ref{req:ethereal-closure-8}.

If \Veim{base} is a quasi-prediction,
then
we have
Requirement~\ref{req:ethereal-closure-12},
by self-identity and
\eqref{eq:ethereal-closure-20}.
If \Veim{base} is quasi-confirmed, we
have
Requirement~\ref{req:ethereal-closure-12}
vacuously.

If \Veim{base} is a quasi-prediction,
then
we have
Requirement~\ref{req:ethereal-closure-15}
vacuously.
If \Veim{base} is quasi-confirmed, we
have
Requirement~\ref{req:ethereal-closure-15}
by self-identity.
This shows all the requirements for the basis of the induction.

\textbf{Step}:
For the step of the induction, we assume
\eqref{eq:ethereal-closure-18} for $\var{x} = \var{i}$,
to show
\eqref{eq:ethereal-closure-18} for $\var{x} = \Vincr{i}$.
We consider, without loss of generality,
just one of the EIM's in $\var{eims}[\var{i}+1]$.
Call it \Veim{wlog2}.
By assumption for the step,
\Veim{wlog2} is not in $\var{eims}[0]$,
so that it has a top-down
cause in
$\var{eims}[\var{i}]$.
Call this top-down cause, \Veim{wlog1}.

We show Requirement~\ref{req:ethereal-closure-3}
by cases,
depending on the type of \Veim{wlog2}.
By definition of \var{ethereal-closure} for EIM's,
\Veim{wlog2} is a null-scan or a prediction.
Theorem \ref{t:prediction-from-cause}
shows that the
validity of
top-down cause \Veim{wlog1}
is sufficient to make
\Veim{wlog2} valid,
if \Veim{wlog2} is a prediction.
Theorem \ref{t:null-scan-from-down-cause}
shows that the
validity of
top-down cause \Veim{wlog1}
is sufficient to make
\Veim{wlog2} valid,
if \Veim{wlog2} is a null-scan.
We have both cases
and therefore have shown
Requirement~\ref{req:ethereal-closure-3}
for the step.

The EIM types are defined in terms of the types of their
dotted rules,
so that
\begin{gather}
\text{if $\langle \Veim{wlog1}, \Veim{wlog2} \rangle \in \var{epsilon-op},$} \\
\label{eq:ethereal-closure-27}
\text{then} \quad \big\langle \DR{\Veim{wlog1}}, \DR{\Veim{wlog2}} \big\rangle \in \var{epsilon-dr-op}.
\end{gather}
By the definition of the ethereal closure for dotted rules,
\begin{gather}
\label{eq:ethereal-closure-30}
\var{ethereal-dr-closure} = \var{epsilon-dr-op}^\ast
\end{gather}
and by assumption for the step
\begin{equation}
\label{eq:ethereal-closure-33}
\DR{\Veim{wlog1}} \in \var{ethereal-dr-closure}(\DR{\Veim{base}}).
\end{equation}
Using
\eqref{eq:ethereal-closure-27},
\eqref{eq:ethereal-closure-30}
and
\eqref{eq:ethereal-closure-33},
we have
\begin{equation*}
\DR{\Veim{wlog2}} \in \var{ethereal-dr-closure}(\DR{\Veim{base}}),
\end{equation*}
which is Requirement~\ref{req:ethereal-closure-5}
for the step.

If \Veim{wlog2} is a prediction,
we know from Theorem \ref{t:prediction-from-cause}
that
\begin{equation}
\label{eq:ethereal-closure-36}
\Current{\Veim{wlog1}} = \Current{\Veim{wlog2}}.
\end{equation}

If \Veim{wlog2} is a null-scan,
we know from Theorem \ref{t:right-location-of-top-down-cause}
that
\begin{align}
\Right{\Veim{wlog1}} & = \Right{\Veim{wlog2}}
\intertext{and since the right location of an EIM is also its current location,}
\label{eq:ethereal-closure-39}
\Current{\Veim{wlog1}} & = \Current{\Veim{wlog2}}.
\end{align}
Also, for null-scans, we know from
Theorem
\ref{t:effect-from-symbolic-cause-pair}
that
\begin{equation}
\label{eq:ethereal-closure-42}
\Left{\Veim{wlog1}} = \Left{\Veim{wlog2}}.
\end{equation}

If \Veim{wlog2} is a quasi-prediction, we know from
\eqref{eq:ethereal-closure-20} that
\begin{equation}
\label{eq:ethereal-closure-45}
\Current{\Veim{wlog2}} = \Left{\Veim{wlog2}}.
\end{equation}

We have
\begin{equation}
\label{eq:ethereal-closure-48}
\Current{\Veim{wlog1}} = \Current{\Veim{wlog2}}
\end{equation}
from
\eqref{eq:ethereal-closure-36}
for predictions and from
\eqref{eq:ethereal-closure-39}
for null-scans.
Either way, we have
Requirement~\ref{req:ethereal-closure-8} for
the step of the induction.

We have
Requirement~\ref{req:ethereal-closure-12}
from
\eqref{eq:ethereal-closure-20} and
\eqref{eq:ethereal-closure-48}
for quasi-predictions;
and vacuously for quasi-confirmed EIM's.

We have
Requirement~\ref{req:ethereal-closure-15}
from \eqref{eq:ethereal-closure-42} for
quasi-confirmed EIM's,
and vacuously for quasi-predictions.

This shows all five requirements and,
since the choice of \Veim{wlog2} was
without loss of generality,
we have shown
\eqref{eq:ethereal-closure-18} for $\var{eims}[\var{i}+1]$.
With this,
we have shown the step of the induction,
the induction,
and the theorem.
\end{proof}

\section{Fleeting closures}

\begin{theorem}
\ttitle{\myfnname{null-scan-op} is a function}
\label{t:null-scan-op-function}
\myfnname{null-scan-op}
and its inverse are partial functions
of the domain of valid EIM's,
and their codomain is
the set of valid EIM's.
\end{theorem}

\begin{proof}
\begin{align}
\label{eq:null-scan-op-function-10}
& \myparbox{%
\myfnname{null-scan-op}
is a relation whose domain is the valid EIM's
and whose codomain is the valid EIM's
\becuz{}
\dref[\myfnname{null-scan-op}]{def:null-scan-op}.
} \\
\label{eq:null-scan-op-function-14}
& \myparbox{%
$[ \Veim{down}, \Veim{eff} ] \in \myfnname{null-scan-op}$
if and only if two conditions hold:
\Veim{eff} is a null-scan and
\Veim{down} is the top-down cause
of \Veim{eff}
\becuz{}
\dref[\myfnname{null-scan-op}]{def:null-scan-op}.
} \\
\label{eq:null-scan-op-function-16}
& \myparbox{%
For every \Veim{down}, there is at most one
\Veim{eff}
\becuz{}
\eqref{eq:null-scan-op-function-14},
\tref{t:null-scan-from-down-cause},
so that \myfnname{null-scan-op} is a function.
} \\
\label{eq:null-scan-op-function-18}
& \myparbox{%
For every \Veim{eff}, there is at most one
\Veim{down}
\becuz{}
\eqref{eq:null-scan-op-function-14},
\tref{t:null-scan-from-down-cause},
so that the inverse of \myfnname{null-scan-op} is a function.
}
\end{align}
The theorem follows from
\eqref{eq:null-scan-op-function-10},
\eqref{eq:null-scan-op-function-16}
and
\eqref{eq:null-scan-op-function-18}.
\end{proof}

Based on
\tref{t:null-scan-op-function},
we will write null-scan-op,
and its inverse, as functions
so that
the relation
\[
\op{null-scan-op}{\Veim{x}, \Veim{y}}
\]
is equivalent to the functions
\begin{gather*}
\op{null-scan-op}{\Veim{x}} = \Veim{y}%
\index{recce-notation}{null-scan-op@\Vop{null-scan-op}{eim1}!as a function}
\quad \text{and}
\\
\iop{null-scan-op}{(-1)}{\Veim{y}} = \Veim{x}.%
\index{recce-notation}{null-scan-op@\Vop{null-scan-op}{eim1}!as an inverse function}
\end{gather*}

\begin{theorem}
\ttitle{\myfnname{null-scan-op} definedness}
\label{t:null-scan-op-definedness}
\myfnname{null-scan-op} is defined if and only if
the postdot symbol of its argument is nulling:
\[
\op{null-scan-op}{\Veim{cuz}} \neq \undefined
\equiv \Postdot{\Veim{cuz}} = \epsilon.
\]
Further, if \op{null-scan-op}{\Veim{e}} is defined,
then
\[
\begin{gathered}
\Rule{\Veim{e}} = \Rule{\op{null-scan-op}{\Veim{e}}}, \\
\Left{\Veim{e}} = \Left{\op{null-scan-op}{\Veim{e}}}, \\
\Right{\Veim{e}} = \Right{\op{null-scan-op}{\Veim{e}}}, \text{and} \\
\Vincr{\Dotix{\Veim{e}}} = \Dotix{\op{null-scan-op}{\Veim{e}}}.
\end{gathered}
\]
\end{theorem}

\begin{proof}
This theorem follows from
\dref[\myfnname{null-scan-op}]{def:null-scan-op},
\tref{t:null-scan-from-down-cause}
and
\tref{t:null-scan-op-function}.
\end{proof}

\begin{theorem}
\ttitle{Inverse \myfnname{null-scan-op} definedness}
\label{t:inverse-null-scan-op-definedness}
The inverse of
\myfnname{null-scan-op} is defined if and only if
the predot symbol of its argument is nulling:
\[
\iop{null-scan-op}{(-1)}{\Veim{cuz}} \neq \undefined
\equiv \Predot{\Veim{cuz}} = \epsilon.
\]
Further, if \iop{null-scan-op}{(-1)}{\Veim{e}} is defined,
then
\[
\begin{gathered}
\Rule{\Veim{e}} = \Rule{\iop{null-scan-op}{(-1)}{\Veim{e}}}, \\
\Left{\Veim{e}} = \Left{\iop{null-scan-op}{(-1)}{\Veim{e}}}, \\
\Right{\Veim{e}} = \Right{\iop{null-scan-op}{(-1)}{\Veim{e}}}, \text{and} \\
\Vdecr{\Dotix{\Veim{e}}} = \Dotix{\iop{null-scan-op}{(-1)}{\Veim{e}}}.
\end{gathered}
\]
\end{theorem}

\begin{proof}
This theorem follows from
\tref{t:null-scan-op-function}
and
\tref{t:null-scan-op-definedness}.
\end{proof}

\begin{theorem}
\ttitle{Iterated \myfnname{null-scan-op}}
\label{t:iterated-null-scan-op}
Let \Veim{bas} be a valid EIM
and
let \var{x} be an integer
such that $\var{x} \ge 0$.
Then, if
\[
\forall \; \var{i} :
\left(
\begin{gathered}
  \Dotix{\Veim{bas}} \le \var{i} < \Dotix{\Veim{bas}}+\var{x}
  \\
  \quad \implies \el{\RHS{\Veim{bas}}}{\var{i}} = \epsilon
\end{gathered}
\right),
\]
we have all of the following:
\begin{subequations}
\renewcommand{\theequation}{R\arabic{equation}}
\begin{align}
\label{eq:iterated-null-scan-op-req-1}
\Rule{\iop{null-scan-op}{\var{x}}{\Veim{bas}}} & = \Rule{\Veim{bas}}. \\
\label{eq:iterated-null-scan-op-req-2}
\Left{\iop{null-scan-op}{\var{x}}{\Veim{bas}}} & = \Left{\Veim{bas}}. \\
\label{eq:iterated-null-scan-op-req-3}
\Right{\iop{null-scan-op}{\var{x}}{\Veim{bas}}} & = \Right{\Veim{bas}}. \\
\label{eq:iterated-null-scan-op-req-4}
\Dotix{\iop{null-scan-op}{\var{x}}{\Veim{bas}}} & = \Dotix{\Veim{bas}} + \var{x}.
\end{align}
\end{subequations}
\end{theorem}

\begin{proof}
We proceed by induction.
As a preliminary, a few reminders will be useful.
First,
the value of a function iterated zero times is
the value of its argument:
\begin{equation}
\label{eq:iterated-null-scan-op-4}
\iop{null-scan-op}{0}{\Veim{bas}} = \Veim{bas}.
\end{equation}
Second,
the postdot symbol of an EIM
is the symbol on its RHS at the dot index:
\begin{equation}
\label{eq:iterated-null-scan-op-7}
\myparbox{%
$\Postdot{\Veim{e}} = (\RHS{\Veim{e}})[\Dotix{\Veim{e}}]$
\newline
\becuz{}
\dref[Postdot]{def:postdot},
\dref[Dot index]{def:dotted-rule},
\dref[DR notion referring to EIM]{def:eim-dr-notions}.
}
\end{equation}
Finally, because rule notions applied to
a dotted rule apply to its rule
\dref{def:dr-rule-notions},
we have
\begin{equation}
\label{eq:iterated-null-scan-op-8}
\RHS{\Rule{\Veim{e}}} \equiv \RHS{\Veim{e}}.
\end{equation}
In this proof,
unless clarity or emphasis suggest otherwise,
use of these reminders
will be implicit.

\textbf{Hypothesis}:
The induction hypothesis is that
\begin{subequations}
\label{eq:iterated-null-scan-op-10}
\begin{align}
\label{eq:iterated-null-scan-op-12}
& \text{if} \quad \forall \; \var{i}
\left(
\begin{gathered}
\Dotix{\Veim{bas}} \le \var{i} < \Dotix{\Veim{bas}}+\var{x}
\\
  \implies \el{\RHS{\Veim{bas}}}{\var{i}} = \epsilon
\\
\end{gathered}
\right)
\\
\notag
& \text{then we have all of the following:}
\\
\label{eq:iterated-null-scan-op-14}
& \Rule{\iop{null-scan-op}{\var{x}}{\Veim{bas}}} = \Rule{\Veim{bas}}. \\
\label{eq:iterated-null-scan-op-16}
& \Left{\iop{null-scan-op}{\var{x}}{\Veim{bas}}} = \Left{\Veim{bas}}. \\
\label{eq:iterated-null-scan-op-18}
& \Right{\iop{null-scan-op}{\var{x}}{\Veim{bas}}} = \Right{\Veim{bas}}. \\
\label{eq:iterated-null-scan-op-20}
& \begin{aligned}
& \Postdot{\iop{null-scan-op}{\var{x}}{\Veim{bas}}}
\\
& \qquad = \big( \RHS{\Rule{\Veim{bas}}} \big)
	      [\Dotix{\Veim{bas}} + \var{x}].
\end{aligned}
\\
\label{eq:iterated-null-scan-op-22}
& \Dotix{\iop{null-scan-op}{\var{x}}{\Veim{bas}}} = \Dotix{\Veim{bas}} + \var{x}.
\end{align}
\end{subequations}

\textbf{Basis}:
We take as the basis \eqref{eq:iterated-null-scan-op-10}
on the assumption that
\begin{equation}
\label{eq:iterated-null-scan-op-26}
\var{x} = 0 \becuz \text{ASM for basis}.
\end{equation}
Where $\var{x} = 0$,
the antecedent of the induction hypothesis,
\eqref{eq:iterated-null-scan-op-12},
is vacuously true.
We have
\eqref{eq:iterated-null-scan-op-14}--%
\eqref{eq:iterated-null-scan-op-18}
from
\eqref{eq:iterated-null-scan-op-4}
and
\eqref{eq:iterated-null-scan-op-26}.
We have
\eqref{eq:iterated-null-scan-op-20}
from
\eqref{eq:iterated-null-scan-op-4},
\eqref{eq:iterated-null-scan-op-26}
and
\eqref{eq:iterated-null-scan-op-7}.
The last requirement to show the basis is
\eqref{eq:iterated-null-scan-op-22},
which follows from
\eqref{eq:iterated-null-scan-op-4}
and
\eqref{eq:iterated-null-scan-op-26}.

\textbf{Step}:
For the step, we assume 
\begin{equation}
\label{eq:iterated-null-scan-op-30}
\myparbox{%
the induction hypothesis \eqref{eq:iterated-null-scan-op-10}
for $\var{x} = \var{n}$,
}
\end{equation}
to show
\begin{equation}
\label{eq:iterated-null-scan-op-32}
\myparbox{%
the induction hypothesis \eqref{eq:iterated-null-scan-op-10}
for $\var{x} = \Vincr{n}$.
}
\end{equation}
The step proceeds by cases.

\textbf{Step case 1}:
For the first case of the induction step,
assume that
\begin{align}
\label{eq:iterated-null-scan-op-34}
& \myparbox{%
equation \eqref{eq:iterated-null-scan-op-12}
is false
for $\var{x} = \Vincr{n}$
\becuz{}
ASM for this case of the step.
}
\intertext{%
so that we have, vacuously, that
}
\label{eq:iterated-null-scan-op-36}
& \myparbox{%
equation \eqref{eq:iterated-null-scan-op-10}
for $\var{x} = \Vincr{n}$
\becuz{}
\eqref{eq:iterated-null-scan-op-34},
which shows the first case
of the induction step.
}
\end{align}

\textbf{Step case 2}:
For the second case of the induction step,
assume that
\begin{align}
\label{eq:iterated-null-scan-op-37}
& \myparbox{%
equation \eqref{eq:iterated-null-scan-op-12}
is true for 
$\var{x} = \Vincr{n}$
\becuz{}
ASM for case of step.
} \\
\label{eq:iterated-null-scan-op-38}
& \begin{aligned}
  & \forall \; \var{i}
  \left(
  \begin{aligned}
    & \Dotix{\Veim{bas}} \le \var{i} < \Dotix{\Veim{bas}}+\Vincr{n}
    \\
    & \qquad \implies \el{\RHS{\Veim{bas}}}{\var{i}} = \epsilon
    \\
  \end{aligned}
  \right)
  \\
  & \qquad \becuz
  \eqref{eq:iterated-null-scan-op-37}.
\end{aligned}
\\
\label{eq:iterated-null-scan-op-40}
& \begin{aligned}
  & \forall \; \var{i}
  \left(
  \begin{aligned}
    & \Dotix{\Veim{bas}} \le \var{i} < \Dotix{\Veim{bas}}+\var{n}
    \\
    & \qquad
      \implies \el{\RHS{\Veim{bas}}}{\var{i}} = \epsilon
    \\
  \end{aligned}
  \right)
  \\
  & \qquad \becuz
  \eqref{eq:iterated-null-scan-op-38}.
\end{aligned}
\\
\label{eq:iterated-null-scan-op-42}
& (\RHS{\Veim{bas}})[\Dotix{\Veim{bas}}+\var{n}] = \epsilon
  \becuz
  \eqref{eq:iterated-null-scan-op-38}.
\\
\label{eq:iterated-null-scan-op-44}
& \myparbox{%
Equation \eqref{eq:iterated-null-scan-op-12}
for
$\var{x} = \var{n}$
\becuz{}
\eqref{eq:iterated-null-scan-op-40}.
} \\
\label{eq:iterated-null-scan-op-46}
& \myparbox{%
$\Rule{\iop{null-scan-op}{\var{n}}{\Veim{bas}}} = \Rule{\Veim{bas}}$
\becuz{}
\eqref{eq:iterated-null-scan-op-30},
\eqref{eq:iterated-null-scan-op-44}.
} \\
\label{eq:iterated-null-scan-op-48}
& \myparbox{%
$\Left{\iop{null-scan-op}{\var{n}}{\Veim{bas}}} = \Left{\Veim{bas}}$
\becuz{}
\eqref{eq:iterated-null-scan-op-30},
\eqref{eq:iterated-null-scan-op-44}.
} \\
\label{eq:iterated-null-scan-op-50}
& \myparbox{%
$\Right{\iop{null-scan-op}{\var{n}}{\Veim{bas}}} = \Right{\Veim{bas}}$
\becuz{}
\eqref{eq:iterated-null-scan-op-30},
\eqref{eq:iterated-null-scan-op-44}.
} \\
\label{eq:iterated-null-scan-op-52}
& \myparbox{%
$\Postdot{\iop{null-scan-op}{\var{n}}{\Veim{bas}}}$ \newline
\hspace*{1em} $= \big( \RHS{\Rule{\Veim{bas}}} \big)
	      [\Dotix{\Veim{bas}} + \var{n}]$
	      \newline
\becuz{}
\eqref{eq:iterated-null-scan-op-30},
\eqref{eq:iterated-null-scan-op-44}.
} \\
\label{eq:iterated-null-scan-op-53}
& \myparbox{%
$\Dotix{\iop{null-scan-op}{\var{n}}{\Veim{bas}}} = \Dotix{\Veim{bas}} + \var{n}$
\becuz{}
\eqref{eq:iterated-null-scan-op-30},
\eqref{eq:iterated-null-scan-op-44}.
} \\
\label{eq:iterated-null-scan-op-54}
& \myparbox{%
$\Postdot{\iop{null-scan-op}{\var{n}}{\Veim{bas}}} = \epsilon$
\becuz{}
\eqref{eq:iterated-null-scan-op-42},
\eqref{eq:iterated-null-scan-op-52}.
} \\
\label{eq:iterated-null-scan-op-55}
& \myparbox{%
$\op{null-scan-op}{\iop{null-scan-op}{\var{n}}{\Veim{bas}}}$
\newline
\hspace*{1em} $= \iop{null-scan-op}{\Vincr{n}}{\Veim{bas}} \neq \undefined$
\newline
\becuz{}
\eqref{eq:iterated-null-scan-op-54},
\tref{t:null-scan-op-definedness}.
} \\
\label{eq:iterated-null-scan-op-56}
& \myparbox{%
$\Rule{\iop{null-scan-op}{\var{n}}{\Veim{bas}}}$ \newline
\hspace*{1em} $= \Rule{\op{null-scan-op}{\iop{null-scan-op}{\var{n}}{\Veim{bas}}}}$
\newline
\hspace*{1em} $= \Rule{\iop{null-scan-op}{\Vincr{n}}{\Veim{bas}}}$.
\newline
\becuz{}
\eqref{eq:iterated-null-scan-op-55},
\tref{t:null-scan-op-definedness}.
} \\
\label{eq:iterated-null-scan-op-58}
& \myparbox{%
$\Left{\iop{null-scan-op}{\var{n}}{\Veim{bas}}}$ \newline
\hspace*{1em} $= \Left{\op{null-scan-op}{\iop{null-scan-op}{\var{n}}{\Veim{bas}}}}$
\newline
\hspace*{1em} $= \Left{\iop{null-scan-op}{\Vincr{n}}{\Veim{bas}}}$.
\newline
\becuz{}
\eqref{eq:iterated-null-scan-op-55},
\tref{t:null-scan-op-definedness}.
} \\
\label{eq:iterated-null-scan-op-60}
& \myparbox{%
$\Right{\iop{null-scan-op}{\var{n}}{\Veim{bas}}}$ \newline
\hspace*{1em} $= \Right{\op{null-scan-op}{\iop{null-scan-op}{\var{n}}{\Veim{bas}}}}$
\newline
\hspace*{1em} $= \Right{\iop{null-scan-op}{\Vincr{n}}{\Veim{bas}}}$.
\newline
\becuz{}
\eqref{eq:iterated-null-scan-op-55},
\tref{t:null-scan-op-definedness}.
} \\
\label{eq:iterated-null-scan-op-62}
& \myparbox{%
$\incr{\Dotix{\iop{null-scan-op}{\var{n}}{\Veim{bas}}}}$ \newline
\hspace*{1em} $= \Dotix{\op{null-scan-op}{\iop{null-scan-op}{\var{n}}{\Veim{bas}}}}$
\newline
\hspace*{1em} $= \Dotix{\iop{null-scan-op}{\Vincr{n}}{\Veim{bas}}}$.
\newline
\becuz{}
\eqref{eq:iterated-null-scan-op-55},
\tref{t:null-scan-op-definedness}.
} \\
\label{eq:iterated-null-scan-op-64}
& \myparbox{%
$\Rule{\iop{null-scan-op}{\Vincr{n}}{\Veim{bas}}}$ \newline
\hspace*{1em} $= \Rule{\Veim{bas}}.$
\newline
\becuz{}
\eqref{eq:iterated-null-scan-op-46},
\eqref{eq:iterated-null-scan-op-56},
which is requirement
\eqref{eq:iterated-null-scan-op-14}
for this case of the step.
} \\
\label{eq:iterated-null-scan-op-66}
& \myparbox{%
$\Left{\iop{null-scan-op}{\Vincr{n}}{\Veim{bas}}}$ \newline
\hspace*{1em} $= \Left{\Veim{bas}}.$
\newline
\becuz{}
\eqref{eq:iterated-null-scan-op-48},
\eqref{eq:iterated-null-scan-op-58},
which is requirement
\eqref{eq:iterated-null-scan-op-16}
for this case of the step.
} \\
\label{eq:iterated-null-scan-op-68}
& \myparbox{%
$\Right{\iop{null-scan-op}{\Vincr{n}}{\Veim{bas}}}$ \newline
\hspace*{1em} $= \Right{\Veim{bas}}.$
\newline
\becuz{}
\eqref{eq:iterated-null-scan-op-50},
\eqref{eq:iterated-null-scan-op-60},
which is requirement
\eqref{eq:iterated-null-scan-op-18}
for this case of the step.
} \\
\label{eq:iterated-null-scan-op-70}
& \myparbox{%
$\Dotix{\iop{null-scan-op}{\Vincr{n}}{\Veim{bas}}}$ \newline
\hspace*{1em} $= \Dotix{\Veim{bas}} + \var{n} + 1.$
\newline
\becuz{}
\eqref{eq:iterated-null-scan-op-53},
\eqref{eq:iterated-null-scan-op-62},
which is requirement
\eqref{eq:iterated-null-scan-op-22}
for this case of the step.
} \\
\label{eq:iterated-null-scan-op-72}
& \myparbox{%
\Postdot{\iop{null-scan-op}{\Vincr{n}}{\Veim{bas}}}
\newline
\hspace*{1em}
$= (\RHS{
  \iop{null-scan-op}{\Vincr{n}}{\Veim{bas}}
})[$
\newline
\hspace*{2em}
  \Dotix{\iop{null-scan-op}{\Vincr{n}}{\Veim{bas}}}
\newline
\hspace*{1em}
$]$,
\becuz{}
\eqref{eq:iterated-null-scan-op-7},
\eqref{eq:iterated-null-scan-op-55},
\tref{t:null-scan-op-definedness}.
} \\
\label{eq:iterated-null-scan-op-74}
& \myparbox{%
\Postdot{\iop{null-scan-op}{\Vincr{n}}{\Veim{bas}}}
\newline
\hspace*{1em}
$= (\RHS{\iop{null-scan-op}{\Vincr{n}}{\Veim{bas}}})[$
\newline
\hspace*{2em}
  $\Dotix{\Veim{bas}} + \var{n} + 1$
\newline
\hspace*{1em}
$]$,
\becuz{}
\eqref{eq:iterated-null-scan-op-70},
\eqref{eq:iterated-null-scan-op-72}.
} \\
\label{eq:iterated-null-scan-op-76}
& \myparbox{%
\Postdot{\iop{null-scan-op}{\Vincr{n}}{\Veim{bas}}}
\newline
\hspace*{1em}
$= (\RHS{\Rule{\iop{null-scan-op}{\Vincr{n}}{\Veim{bas}}}})[$
\newline
\hspace*{2em}
  $\Dotix{\Veim{bas}} + \var{n} + 1$
\newline
\hspace*{1em}
$]$,
\becuz{}
\eqref{eq:iterated-null-scan-op-74},
\dref[rule notions applied to EIM's]{def:eim-rule-notions}.
} \\
\label{eq:iterated-null-scan-op-78}
& \myparbox{%
\Postdot{\iop{null-scan-op}{\Vincr{n}}{\Veim{bas}}}
\newline
\hspace*{1em}
$= (\RHS{\Rule{\Veim{bas}}})[$
\newline
\hspace*{2em}
  $\Dotix{\Veim{bas}} + \var{n} + 1$
\newline
\hspace*{1em}
$]$,
\becuz{}
\eqref{eq:iterated-null-scan-op-64},
\eqref{eq:iterated-null-scan-op-76}.
} \\
\label{eq:iterated-null-scan-op-80}
& \myparbox{%
\Postdot{\iop{null-scan-op}{\Vincr{n}}{\Veim{bas}}}
\newline
\hspace*{1em}
  $= (\RHS{\Veim{bas}})[ \Dotix{\Veim{bas}} + \var{n} + 1 ]$,
\newline
\hspace*{1em}
\becuz{}
\eqref{eq:iterated-null-scan-op-78},
\dref[rule notions applied to EIM's]{def:eim-rule-notions},
which is requirement
\eqref{eq:iterated-null-scan-op-20}
for this case of the step.
} \\
\label{eq:iterated-null-scan-op-82}
& \myparbox{%
Equation \eqref{eq:iterated-null-scan-op-10}
for $\var{x} = \Vincr{n}$
\becuz{}
\eqref{eq:iterated-null-scan-op-64},
\eqref{eq:iterated-null-scan-op-66},
\eqref{eq:iterated-null-scan-op-68},
\eqref{eq:iterated-null-scan-op-70},
\eqref{eq:iterated-null-scan-op-80},
which shows the second case
of the induction step.
}
\end{align}

Equations
\eqref{eq:iterated-null-scan-op-36}
and
\eqref{eq:iterated-null-scan-op-82}
show both cases of the induction step,
and therefore the induction step.
From the induction step, we have
\begin{equation}
\label{eq:iterated-null-scan-op-84}
\myparbox{the induction hypothesis
  \eqref{eq:iterated-null-scan-op-10}
  for all $\var{x} \ge 0$.
}
\end{equation}
Note that,
in \eqref{eq:iterated-null-scan-op-84},
where $\var{x} > \Vlastix{\RHS{\Veim{bas}}}$,
then 
$(\RHS{\Veim{bas}})[\var{x}] = \undefined$,
so that we have
\eqref{eq:iterated-null-scan-op-10} vacuously.
The theorem follows directly from
\eqref{eq:iterated-null-scan-op-84}.
\end{proof}

TODO: TOHERE

\begin{theorem}
\ttitle{Iterated \myfnname{null-scan-op} and nulls}
\label{t:iterated-null-scan-op-and-nulls}
Let \iop{null-scan-op}{\var{n}}{\Veim{e}} be
defined for some valid \Veim{e}.
Then
\begin{subequations}
\renewcommand{\theequation}{R\arabic{equation}}
\begin{align}
\label{eq:iterated-null-scan-op-and-nulls-req-10}
& \myparbox{%
$\forall \; \var{i} : (0 \le \var{i} < \var{n})$
\newline
\hspace*{2em} $\implies \Postdot{\iop{null-scan-op}{\var{i}}{\Veim{e}}} = \epsilon$.
}
\\
\label{eq:iterated-null-scan-op-and-nulls-req-12}
& \myparbox{%
$\forall \; \var{i} : (0 < \var{i} \le \var{n})$
\newline
\hspace*{2em} $\implies \Predot{\iop{null-scan-op}{\var{i}}{\Veim{e}}} = \epsilon$.
}
\\
\label{eq:iterated-null-scan-op-and-nulls-req-14}
& \myparbox{%
    If $\var{r} = \Rule{\iop{null-scan-op}{\var{i}}{\Veim{e}}}$
    for any
    $0 \le \var{i} \le \var{n}$, then
    \newline
  \hspace*{1em} $\RHS{\var{r}} \big[
    \Dotix{\el{pfs}{0}} \ldots \Dotix{\el{pfs}{\Vdecr{n}}}
  \big] = \epsilon$.
}
\end{align}
\end{subequations}
\end{theorem}

\begin{proof}
TODO

\myparbox{%
$\forall \var{i} : 0 < \var{i} \le \var{n}$ \newline
\hspace*{1em} $\implies (\Predot{\iop{null-scan-op}{\var{i}}{\Veim{e}}}$ \newline
\hspace*{3em} $= \Postdot{\iop{null-scan-op}{(\Vdecr{i})}{\Veim{e}}})$ \newline
\becuz{}
\dref[Predot]{def:predot},
\dref[Postdot]{def:postdot},
\dref[\myfnname{null-scan-op}]{def:null-scan-op},
\tref{t:null-scan-from-down-cause}
and
\tref{t:null-scan-op-function}.
}

\myparbox{%
TODO: fix \newline
$\forall \var{i} : 0 \le \var{i} < \var{n}$ \newline
\hspace*{1em} $\implies ( \Postdot{\iop{null-scan-op}{\var{n}}{\Veim{e}}}$ \newline
\hspace*{3em} $= \el{rhs}{\Dotix{\iop{null-scan-op}{\var{n}}{\Veim{e}}}})$
\newline
\becuz{}
\dref[Postdot]{def:postdot},
\dref[Dot index]{def:dotted-rule},
\dref[DR notion referring to EIM]{def:eim-dr-notions}.
}

\myparbox{%
\iop{null-scan-op}{\var{n}}{\Veim{e}} is defined
\becuz{}
ASM for this theorem.
}

\myparbox{%
$\forall \var{i} : 0 \le \var{i} \le \var{n}$ \newline
\hspace*{1em} $\implies \iop{null-scan-op}{\var{i}}{\Veim{e}}$ are defined
\newline
\becuz{}
ASM for this theorem.
}

\myparbox{%
$\forall \var{i} : 0 < \var{i} \le \var{n}$ \newline
\hspace*{1em} $\implies \iop{null-scan-op}{\var{i}}{\Veim{e}}$ \newline
\hspace*{3em} $= \op{null-scan-op}{\iop{null-scan-op}{(\Vdecr{i})}{\Veim{e}}}$.
\newline
\becuz{}
definition of an iterated function.
}

\myparbox{%
$\forall \var{i} : 0 \le \var{i} < \var{n}$ \newline
\hspace*{1em} $\implies \Postdot{\iop{null-scan-op}{\var{i}}{\Veim{e}}} = \epsilon$ \newline
\becuz{}
TODO,
\tref{t:null-scan-op-definedness}.
}


TODO: finish

\end{proof}

\begin{definition}
\dtitle{Partial fleeting sequence}
\label{def:partial-fleeting-sequence}
Let \var{pfs} be a sequence.
We define the
\dfn{partial fleeting sequence}%
\index{recce-definitions}{fleeting sequence@fleeting sequence!partial}
of a valid EIM, call it \Veim{e},
as a sequence, call it \var{pfs},
such that for all $\var{i} > 0$,
if \iop{null-scan-op}{\var{i}}{\Veim{e}} is defined,
then
\[
   \Vel{pfs}{i} = \iop{null-scan-op}{\var{i}}{\Veim{e}}.
\]
Note the special case where
\[
   \el{pfs}{0} = \iop{null-scan-op}{0}{\Veim{e}} = \Veim{e}.
\]
\end{definition}

\begin{theorem}
\ttitle{Partial fleeting sequence is contiguous}
\label{t:partial-fleeting-sequence-contiguous}
Let \var{fc} be the fleeting closure of \Veim{bas},
and let \var{pfs} be its partial fleeting sequence.
Then the sequence \var{pfs} is contiguous,
starting at 0.
\end{theorem}

\begin{proof}
From 
\dref[partial fleeting sequence]{def:partial-fleeting-sequence},
it can be seen directly that the indexes of \var{pfs} are iterations
of a function, and therefore non-negative.
It can also be seen directly from
\dref{def:partial-fleeting-sequence} that $\el{pfs}{0} = \Veim{bas}$,
so that there is a zero'th element of \var{pfs}.

It remains to show that the elements of \var{pfs} are contiguous.
We assume for a reductio that
\begin{align}
\label{eq:partial-fleeting-sequence-contiguous-20}
& \myparbox{%
\var{pfs} contains at least one non-contiguous element
\becuz{}
ASM for reductio.
Let the first non-contiguous element be \Vel{pfs}{j}.
} \\
\label{eq:partial-fleeting-sequence-contiguous-20-5}
& \myparbox{%
$\var{j} > 0$ \becuz{}
an element at index 0 is always contiguous.
} \\
\label{eq:partial-fleeting-sequence-contiguous-21-1}
& \myparbox{%
\Vel{pfs}{j} is defined.
\becuz{}
\eqref{eq:partial-fleeting-sequence-contiguous-20}.
} \\
\label{eq:partial-fleeting-sequence-contiguous-21-2}
& \myparbox{%
\el{pfs}{\Vdecr{j}} is not defined.
\becuz{}
\eqref{eq:partial-fleeting-sequence-contiguous-20}.
} \\
\label{eq:partial-fleeting-sequence-contiguous-24}
& \myparbox{%
$\Vel{pfs}{j} = \op{null-scan-op}{\iop{null-scan-op}{(\Vdecr{j})}{\Veim{bas}}}$
\becuz{}
\dref[partial fleeting sequence]{def:partial-fleeting-sequence},
\eqref{eq:partial-fleeting-sequence-contiguous-20-5},
\eqref{eq:partial-fleeting-sequence-contiguous-21-1}.
} \\
\label{eq:partial-fleeting-sequence-contiguous-26}
& \myparbox{%
If \op{null-scan-op}{\var{x}} is well-defined,
then \var{x} is a valid EIM
\becuz{}
\tref{t:null-scan-op-function}.
} \\
\label{eq:partial-fleeting-sequence-contiguous-28}
& \myparbox{%
\iop{null-scan-op}{(\Vdecr{j})}{\Veim{bas}}
is a valid EIM
\becuz{}
\eqref{eq:partial-fleeting-sequence-contiguous-21-1},
\eqref{eq:partial-fleeting-sequence-contiguous-24},
\eqref{eq:partial-fleeting-sequence-contiguous-26}.
} \\
\label{eq:partial-fleeting-sequence-contiguous-30}
& \myparbox{%
$\el{pfs}{\Vdecr{j}} = \iop{null-scan-op}{(\Vdecr{j})}{\Veim{bas}}$
\becuz{}
\dref[partial fleeting sequence]{def:partial-fleeting-sequence}.
} \\
\label{eq:partial-fleeting-sequence-contiguous-32}
& \myparbox{%
\el{pfs}{\Vdecr{j}} is defined.
\becuz{}
\eqref{eq:partial-fleeting-sequence-contiguous-28},
\eqref{eq:partial-fleeting-sequence-contiguous-30},
which contradicts
\eqref{eq:partial-fleeting-sequence-contiguous-21-2}
and shows the reductio.
}
\end{align}

From the reductio of
\eqref{eq:partial-fleeting-sequence-contiguous-20}--%
\eqref{eq:partial-fleeting-sequence-contiguous-32},
we conclude that \var{pfs} is contiguous.
\end{proof}

\begin{theorem}
\ttitle{Partial fleeting sequence}
\label{t:partial-fleeting-sequence}
Let \var{fc} be the fleeting closure of \Veim{bas},
and let \var{pfs} be its partial fleeting sequence.
Then the sequence \var{pfs} contains all and only
the elements of \var{fc}.
\end{theorem}

\begin{proof}
\begin{align}
\label{eq:partial-fleeting-sequence-20}
& \myparbox{%
\var{fc} is the reflexive and transitive closure of \myfnname{null-scan-op}
\becuz{} \dref[fleeting closure]{def:fleeting-closure}. 
} \\
\label{eq:partial-fleeting-sequence-21}
& \myparbox{%
$\forall \; \Veim{e} : \Veim{e} \in \var{pfs} \implies
\Veim{e} \in \var{fc}$
\becuz{}
\eqref{eq:partial-fleeting-sequence-20},
and directly from
\dref[partial fleeting sequence]{def:partial-fleeting-sequence}.
} \\
\label{eq:partial-fleeting-sequence-22}
& \myparbox{%
$\forall \; \Veim{e} :
\Veim{e} \in \var{fc} \implies
\exists \var{i} : 
\iop{null-scan-op}{\var{i}}{\Veim{bas}} = \Veim{e}$
\becuz{}
\eqref{eq:partial-fleeting-sequence-20}.
} \\
\label{eq:partial-fleeting-sequence-24}
& \myparbox{%
$\forall \; \Veim{e} :
\Veim{e} \in \var{fc} \implies
\exists \var{i} : 
\Vel{pfs}{i} = \Veim{e}$
\becuz{}
\eqref{eq:partial-fleeting-sequence-22},
\dref[partial fleeting sequence]{def:partial-fleeting-sequence}.
} \\
\label{eq:partial-fleeting-sequence-26}
& \myparbox{%
$\forall \; \Veim{e} : \Veim{e} \in \var{fc} \implies
\Veim{e} \in \var{pfs}$
\becuz{}
\eqref{eq:partial-fleeting-sequence-24}.
} \\
\label{eq:partial-fleeting-sequence-29}
& \myparbox{%
$\forall \; \Veim{e} : \Veim{e} \in \var{fc} \equiv
\Veim{e} \in \var{pfs}$
\becuz{}
\eqref{eq:partial-fleeting-sequence-21},
\eqref{eq:partial-fleeting-sequence-26},
which shows the theorem.
\qedhere
}
\end{align}
\end{proof}

\begin{theorem}
\ttitle{Partial fleeting sequence is unique}
\label{t:partial-fleeting-sequence-uniq}
Let \Veim{bas} be a valid EIM.
The partial fleeting sequence of \Veim{bas} is unique.
\end{theorem}

\begin{proof}
The proof is by reductio.
\begin{align}
\label{eq:partial-fleeting-sequence-uniq-10}
\myparbox{%
\var{pfs1} and \var{pfs2} are partial fleeting sequences
of \Veim{bas},
and $\var{pfs1} \neq \var{pfs2}$
\becuz{}
ASM for reductio.
} \\
\label{eq:partial-fleeting-sequence-uniq-12}
\myparbox{%
There is at least one index, \var{ix}, such that
$\Vel{pfs1}{ix} \neq \Vel{pfs2}{ix}$
\becuz{}
\eqref{eq:partial-fleeting-sequence-uniq-10}.
} \\
\label{eq:partial-fleeting-sequence-uniq-14}
\myparbox{%
There is a first index, \var{ix1}, such that
$\Vel{pfs1}{ix1} \neq \Vel{pfs2}{ix1}$
\becuz{}
\eqref{eq:partial-fleeting-sequence-uniq-12}.
} \\
\label{eq:partial-fleeting-sequence-uniq-16}
\myparbox{%
$\Vel{pfs1}{ix1} = \iop{null-scan-op}{(\var{ix1})}{\Veim{bas}}$
\becuz{}
\dref[partial fleeting sequence]{def:partial-fleeting-sequence}.
} \\
\label{eq:partial-fleeting-sequence-uniq-18}
\myparbox{%
$\Vel{pfs2}{ix1} = \iop{null-scan-op}{(\var{ix1})}{\Veim{bas}}$
\becuz{}
\dref{def:partial-fleeting-sequence}.
} \\
\label{eq:partial-fleeting-sequence-uniq-20}
\myparbox{%
$\Vel{pfs1}{ix1} = \Vel{pfs2}{ix1}$
\becuz{}
\eqref{eq:partial-fleeting-sequence-uniq-16},
\eqref{eq:partial-fleeting-sequence-uniq-18},
which shows the reductio.
}
\end{align}

From the reductio,
we conclude that
$\var{pfs1} = \var{pfs2}$.
\end{proof}

\begin{theorem}
Let \var{pfs} be the partial fleeting sequence
of \Veim{bas}.
\begin{align}
\label{eq:partial-fleeting-sequence-properties-req-27}
& \forall \; \var{i} : (0 \le \var{i} < \Vlastix{pfs})
  \implies \Postdot{\Vel{pfs}{i}} = \epsilon.
\\
\label{eq:partial-fleeting-sequence-properties-req-28}
& \myparbox{%
    If $\var{r} = \Rule{\Vel{pfs}{i}}$
    for any
    $0 \le \var{i} \le \Vlastix{pfs}$, then
    \newline
  \hspace*{2em} $\RHS{\var{r}} \big[
    \Dotix{\el{pfs}{0}} \ldots \Dotix{\el{pfs}{\Vlastix{pfs}}}
  \big] = \epsilon$.
}
\end{align}
\end{theorem}

\begin{proof}

$\forall \; \var{i} : (0 < \var{i} \le \Vlastix{pfs})
\implies (\exists \Veim{e} :
\Vel{pfs}{i} = \Vop{null-scan-op}{\iop{null-scan-op}{(\Vdecr{i})}{\Veim{e}}})
$
\becuz{}
TODO

TODO
\end{proof}

\begin{theorem}
\ttitle{Length of partial fleeting sequence}
\label{t:partial-fleeting-sequence-length}
The length of a partial fleeting sequence is
\begin{itemize}
\item
less than or equal to \Vincr{nulrun},
where \var{nulrun} is
the longest consecutive run of nulling
symbols on the RHS of a rule;
\item
less than or equal to the length of the longest rule; and
\item
\order{c}, where \var{c} is a constant
which depends on the grammar.
\end{itemize}
\end{theorem}

\begin{proof}
TODO
\end{proof}

TODO: TOHERE

TODO: [
New terminology: \newline
``partial fleeting sequence'' is fleeting closure as a sequence \newline
``fleeting sequence'' == ``maximal fleeting sequence'' \newline
``fleeting sequence'' was PREVIOUSLY maximal fleeting closure \newline
``fleeting silo'' == PREVIOUS quasi-complete fleeting closure \newline
Later, prove that ``fleeting silo'' is in fact a silo \newline
]

\begin{theorem}
\ttitle{Partial fleeting sequence properties}
\label{t:partial-fleeting-sequence-properties}
Let \var{pfs} be a partial fleeting sequence.
Then the following hold:
\begin{subequations}
\renewcommand{\theequation}{R\arabic{equation}}
\begin{align}
\label{eq:partial-fleeting-sequence-properties-req-20}
& \begin{aligned}
  & \forall \; \var{i}, \var{j} : (0 \le \var{i} \le \Vlastix{pfs} \land 0 \le \var{j} \le \Vlastix{pfs})
  \\
  & \qquad \implies \Rule{\Vel{pfs}{i}} = \Rule{\Vel{pfs}{j}}.
  \end{aligned}
\\[0.5ex]
\label{eq:partial-fleeting-sequence-properties-req-22}
& \begin{aligned}
  & \forall \; \var{i}, \var{j} : (0 \le \var{i} \le \Vlastix{pfs} \land 0 \le \var{j} \le \Vlastix{pfs})
  \\
  & \qquad \implies \Left{\Vel{pfs}{i}} = \Left{\Vel{pfs}{j}}.
  \end{aligned}
\\[0.5ex]
\label{eq:partial-fleeting-sequence-properties-req-24}
& \begin{aligned}
  & \forall \; \var{i}, \var{j} : (0 \le \var{i} \le \Vlastix{pfs} \land 0 \le \var{j} \le \Vlastix{pfs})
  \\
  & \qquad \implies \Right{\Vel{pfs}{i}} = \Right{\Vel{pfs}{j}}.
  \end{aligned}
\\[0.5ex]
\label{eq:partial-fleeting-sequence-properties-req-26}
& \begin{aligned}
  & \forall \; \var{i} : (0 \le \var{i} < \Vlastix{pfs})
  \\
  & \qquad \implies \Vincr{\Dotix{\Vel{pfs}{i}}} = \Dotix{\el{pfs}{\Vincr{i}}}.
  \end{aligned}
\\[0.5ex]
\label{eq:partial-fleeting-sequence-properties-req-30-1}
& \myparbox{%
  For every \var{i} such that
  $0 \le \var{i} < \Vlastix{pfs}$,
  \Vel{pfs}{i} is never the bottom-up cause of any effect.
} \\
\label{eq:partial-fleeting-sequence-properties-req-30-2}
& \myparbox{%
  For every \var{i} such that
  $0 \le \var{i} < \Vlastix{pfs}$,
  \Vel{pfs}{i} is the only top-down cause of
  \el{pfs}{\Vincr{i}}.
} \\
\label{eq:partial-fleeting-sequence-properties-req-30-3}
& \myparbox{%
  For every \var{i} such that
  $0 \le \var{i} < \Vlastix{pfs}$,
  \el{pfs}{\Vincr{i}} is the only effect of
  \Vel{pfs}{i}.
} \\
\label{eq:partial-fleeting-sequence-properties-req-30-4}
& \myparbox{%
  For every \var{i} such that
  $0 \le \var{i} < \Vlastix{pfs}$,
  \el{pfs}{\Vincr{i}} is the only effect of
  the cause-pair $[\Vel{pfs}{i}, \Vinst{nul}]$,
  where \Vinst{nul} is such that \newline
   \hspace*{2em} $\Symbol{\Vinst{nul}} = \Postdot{\Vel{pfs}{i}} = \epsilon$, \newline
    \hspace*{2em} $\Left{\Vinst{nul}} = \Right{\Vel{pfs}{i}},$ and \newline
    \hspace*{2em} $\Right{\Vinst{nul}} = \Right{\Vel{pfs}{i}}.$
}
\end{align}
\end{subequations}
\end{theorem}

\begin{proof}
TODO.
\end{proof}

TODO: TOHERE

Recall that when we apply dotted rule notions to EIM's
we mean to apply them to the dotted rule of the EIM
\dref{def:eim-dr-notions}.
The following definition makes explicit a specific case
of \dref{def:eim-dr-notions}.

\begin{definition}
\dtitle{Lasting and fleeting bases}
\label{lasting-and-fleeting-bases}
A
\xdfn{lasting base}{lasting base!EIM}
EIM
is an EIM
whose dotted rule is a lasting base.
Any EIM which is not a lasting base
is a
\xdfn{fleeting base}{fleeting base!EIM}.
\end{definition}

TODO:TOHERE

\begin{theorem}
\ttitle{Null scan arithmetic}
\label{t:null-scan-arithmetic}
If \var{fc} is the fleeting closure of \Veim{eim},
and
$0 \le \var{i} \le \Vlastix{fc}$,
then
\[
 \Vel{fc}{i} = \left[
\begin{gathered}
  [
\Rule{\Veim{eim}}, (\Dotix{\Veim{eim}} + \var{i}) ], \\
  \Left{\Veim{eim}},
  \Current{\Veim{eim}}
\end{gathered}
\right].
\]
\end{theorem}

\begin{proof}
Let, without loss of generality,
\begin{gather*}
\el{fc}{0} = \big[ [ \Vrule{r}, \var{lo} ], \var{j}, \var{k} \big]
  \quad \text{and} \\
\var{hi} = \var{lo} + \Vlastix{fc}.
\end{gather*}
By the definition of a fleeting closure
and the definition of \myfnname{null-scan-op},
we have
\begin{align*}
& \forall \; \var{a} : \var{lo} \le \var{a} < \var{hi}
   \implies \Vop{RHS}{\Vrule{r}, \var{a}} = \epsilon
\intertext{so that}
& \forall \; \var{i} : 0 \le \var{i} \le \xxsubtract{\var{hi}}{\var{lo}}
\\
& \qquad \qquad \implies \left(
\el{fc}{\var{i}} =
\big[ [ \Vrule{r}, \var{lo}+\var{i} ], \var{j}, \var{k} \big]
\right).
\qedhere
\end{align*}
\end{proof}

\begin{theorem}
\ttitle{Fleeting closure shared properties}
\label{t:fleeting-closure-shared-properties}
Let \var{fc} be a fleeting closure,
and let \Veim{e1} and \Veim{e2} be two EIM's
such that
 $\Veim{e1} \in \var{fc}$
 and $\Veim{e2} \in \var{fc}$.
Then
\begin{align*}
    \Rule{\Veim{e1}} & = \Rule{\Veim{e2}}, \\
    \Left{\Veim{e1}} & = \Left{\Veim{e2}}, \text{and} \\
    \Right{\Veim{e1}} & = \Right{\Veim{e2}}.
\end{align*}
\end{theorem}

\begin{proof}
This theorem follows directly from
\tref{t:null-scan-arithmetic}.
\end{proof}

\begin{theorem}
\ttitle{Fleeting closure shares quasi-completeness}
\label{t:fleeting-closure-shares-quasi-completeness}
Let \var{fc} be a fleeting closure,
and let \Veim{q} and \Veim{e} be two EIM's,
such that
\begin{align}
\label{eq:fleeting-closure-shares-quasi-completeness-10}
& \text{\Veim{q} is quasi-complete}, \\
\label{eq:fleeting-closure-shares-quasi-completeness-12}
& \text{$\Veim{q} \in \var{fc}$ and} \\
\label{eq:fleeting-closure-shares-quasi-completeness-14}
& \Veim{e} \in \var{fc}.
\end{align}
Then \Veim{e} is also quasi-complete.
\end{theorem}

\begin{proof}
\Veim{q} and \Veim{e} share the same 
rule
\tref{t:fleeting-closure-shared-properties},
\eqref{eq:fleeting-closure-shares-quasi-completeness-12},
\eqref{eq:fleeting-closure-shares-quasi-completeness-14}.
Call this rule \Vrule{r}.  Then

\begin{align}
\label{eq:fleeting-closure-shares-quasi-completeness-20}
& \begin{aligned}
  & \forall \; \var{a} : \Dotix{\Veim{q}} \le \var{a} < \Vsize{\Vrule{r}} \\
  & \qquad \implies \RHS{\Vrule{r}, \var{a}} = \epsilon \\
  & \qquad \qquad \becuz{}
  \eqref{eq:fleeting-closure-shares-quasi-completeness-10},
  \dref[quasi-complete EIM]{def:eim-dr-notions}.
\end{aligned}
\\
\label{eq:fleeting-closure-shares-quasi-completeness-22}
& \begin{aligned}
  & \forall \; \var{a} : \Dotix{\el{fc}{0}} \le \var{a} \le \Dotix{\el{fc}{\Vlastix{fc}}} \\
  & \qquad \implies \RHS{\Vrule{r}, \var{a}} = \epsilon \\
  & \qquad \qquad \becuz
    \dref[fleeting closure]{def:fleeting-closure-sequence}.
\end{aligned}
\\
\label{eq:fleeting-closure-shares-quasi-completeness-24}
& \begin{aligned}
& \Dotix{\el{fc}{0}} \le \Dotix{\Veim{e}} \\
& \qquad \qquad \becuz \Veim{e} \in \var{fc}.
\end{aligned}
\\
\label{eq:fleeting-closure-shares-quasi-completeness-26}
& \begin{aligned}
  & \forall \; \var{a} : \Dotix{\el{fc}{0}} \le \var{a} < \Vsize{\Vrule{r}} \\
  & \qquad \implies \RHS{\Vrule{r}, \var{a}} = \epsilon \\
  & \qquad \qquad \becuz{}
  \eqref{eq:fleeting-closure-shares-quasi-completeness-20},
  \eqref{eq:fleeting-closure-shares-quasi-completeness-22},
  \eqref{eq:fleeting-closure-shares-quasi-completeness-24}.
\end{aligned}
\\
\label{eq:fleeting-closure-shares-quasi-completeness-28}
& \begin{aligned}
  & \forall \; \var{i} : 0 \le \var{i} \le \Vlastix{fc} \\
  & \qquad \implies \Dotix{\el{fc}{0}} \le \Dotix{\Vel{fc}{i}} \\
  & \qquad \qquad \becuz \tref{t:null-scan-arithmetic}.
\end{aligned}
\\
\label{eq:fleeting-closure-shares-quasi-completeness-30}
& \begin{aligned}
  & \forall \; \var{i}, \var{a} :
  \left(
  \begin{gathered}
    0 \le \var{i} \le \Vlastix{fc} \; \text{and} \\
    \Dotix{\Vel{fc}{i}} \le \var{a} < \Vsize{\Vrule{r}}
  \end{gathered}
  \right) \\
  & \qquad \implies \RHS{\Vrule{r}, \var{a}} = \epsilon \\
  & \qquad \qquad \becuz
    \eqref{eq:fleeting-closure-shares-quasi-completeness-26},
    \eqref{eq:fleeting-closure-shares-quasi-completeness-28}.
\end{aligned}
\\
\label{eq:fleeting-closure-shares-quasi-completeness-32}
& \begin{aligned}
  & \forall \; \var{i} : 0 \le \var{i} \le \Vlastix{fc} \\
  & \qquad \implies \text{\Vel{fc}{i} is quasi-complete} \\
  & \qquad \qquad \becuz
    \dref[quasi-complete EIM]{def:eim-dr-notions},
    \eqref{eq:fleeting-closure-shares-quasi-completeness-30}.
    \qedhere
\end{aligned}
\end{align}
\end{proof}

\begin{theorem}
\ttitle{Fleeting closure shares EIM completion}
\label{t:fc-shares-eim-completion}
Let \Veim{e1} and \Veim{e2} be two
quasi-complete EIM's
in the same fleeting closure.
Let \Veim{comp1} be the EIM completion of \Veim{e1}
and let \Veim{comp2} be the EIM completion of \Veim{e2}.
Then $\Veim{comp1} = \Veim{comp2}$.
\end{theorem}

\begin{proof}
Let \var{fc} be a fleeting closure such that
\begin{align}
\label{eq:fc-shares-eim-completion-10}
& \Veim{e1} \in \var{fc}
\becuz \text{ASM for this theorem} \; \text{and}
\\
\label{eq:fc-shares-eim-completion-12}
& \Veim{e2} \in \var{fc}
\becuz \text{ASM for this theorem}.
\\
\label{eq:fc-shares-eim-completion-14}
& \myparbox{%
\Veim{comp1} is the EIM completion of \Veim{e1}
\becuz{} ASM for this theorem.
} \\
\label{eq:fc-shares-eim-completion-16}
& \myparbox{%
\Veim{comp2} is the EIM completion of \Veim{e2}
\becuz{} ASM for this theorem.
} \\
%
\label{eq:fc-shares-eim-completion-18}
& \Rule{\Veim{e1}} = \Rule{\Veim{e2}}
\becuz
\eqref{eq:fc-shares-eim-completion-10},
\eqref{eq:fc-shares-eim-completion-12},
\tref{t:fleeting-closure-shared-properties}.
\\
\label{eq:fc-shares-eim-completion-20}
& \myparbox{%
$\Rule{\Veim{comp1}} = \Rule{\Veim{e1}}$
\becuz
\eqref{eq:fc-shares-eim-completion-14},
\dref[completion EIM of an EIM]{def:eim-dr-notions}.
} \\
\label{eq:fc-shares-eim-completion-22}
& \myparbox{%
$\Rule{\Veim{comp2}} = \Rule{\Veim{e2}}$
\becuz
\eqref{eq:fc-shares-eim-completion-16},
\dref{def:eim-dr-notions}.
} \\
\label{eq:fc-shares-eim-completion-23}
& \Rule{\Veim{comp1}} = \Rule{\Veim{comp2}}
\becuz
\eqref{eq:fc-shares-eim-completion-20},
\eqref{eq:fc-shares-eim-completion-22}.
\\
\label{eq:fc-shares-eim-completion-24}
& \myparbox{%
$\Dotix{\Veim{comp1}} = \Vsize{\Rule{\Veim{e1}}}$
\becuz
\eqref{eq:fc-shares-eim-completion-14},
\dref[completion EIM of an EIM]{def:eim-dr-notions}.
} \\
\label{eq:fc-shares-eim-completion-26}
& \myparbox{%
$\Dotix{\Veim{comp2}} = \Vsize{\Rule{\Veim{e2}}}$
\becuz
\eqref{eq:fc-shares-eim-completion-16},
\dref{def:eim-dr-notions}.
} \\
\label{eq:fc-shares-eim-completion-28}
& \Dotix{\Veim{comp1}} = \Dotix{\Veim{comp2}}
\becuz
\eqref{eq:fc-shares-eim-completion-24},
\eqref{eq:fc-shares-eim-completion-26}.
\\
\label{eq:fc-shares-eim-completion-30}
& \DR{\Veim{comp1}} = \DR{\Veim{comp2}}
\becuz
\eqref{eq:fc-shares-eim-completion-23},
\eqref{eq:fc-shares-eim-completion-28}.
\\
%
\label{eq:fc-shares-eim-completion-32}
& \Left{\Veim{e1}} = \Left{\Veim{e2}}
\becuz
\eqref{eq:fc-shares-eim-completion-10},
\eqref{eq:fc-shares-eim-completion-12},
\tref{t:fleeting-closure-shared-properties}.
\\
\label{eq:fc-shares-eim-completion-34}
& \myparbox{%
$\Right{\Veim{e1}} = \Right{\Veim{e2}}$
\becuz
\eqref{eq:fc-shares-eim-completion-10},
\eqref{eq:fc-shares-eim-completion-12},
\tref{t:fleeting-closure-shared-properties}.
} \\
\label{eq:fc-shares-eim-completion-36}
& \Veim{comp1} = \Veim{comp2}
\becuz 
\eqref{eq:fc-shares-eim-completion-30},
\eqref{eq:fc-shares-eim-completion-32},
\eqref{eq:fc-shares-eim-completion-34}.
\qedhere
\end{align}
\end{proof}

\begin{theorem}
\ttitle{EIM lasting base}
\label{t:eim-lasting-base}
Every valid EIM has exactly one valid lasting base,
and every valid EIM is in the
fleeting closure of its lasting base.
\end{theorem}

\begin{proof}
Let \Veim{eim} be a valid EIM,
and \Veim{bas} its lasting base.
By the definition of a lasting base for an EIM,
\begin{equation}
\label{eq:eim-lasting-base-23}
\begin{aligned}
& \forall \; \var{a} : \Dotix{\Veim{bas}} \le \var{a} < \Dotix{\Veim{eim}} \\
& \qquad \implies \RHS{\Veim{eim}, \var{a}} = \epsilon
\end{aligned}
\end{equation}
and
\begin{equation}
\Dotix{\Veim{bas}} = 0 \; \lor \; \Predot{\Veim{bas}} \neq \epsilon.
\end{equation}

If
$\Dotix{\Veim{eim}} = 0$ or $\Predot{\Veim{eim}} \neq \epsilon$,
we know that \Veim{eim} is its own lasting base:
$\Veim{bas} = \Veim{eim}$.
And, since
\begin{equation}
\label{eq:eim-lasting-base-25}
\myfnname{null-scan-op}^{\displaystyle (0)}(\Veim{bas}) = \Veim{eim}
\end{equation}
we also know that \Veim{eim} is in the fleeting closure of \Veim{bas}.

We now consider the case where
$\Dotix{\Veim{eim}} > 0$ and $\Predot{\Veim{eim}} = \epsilon$.
By
\eqref{eq:eim-lasting-base-23},
we know that if
\[
\var{i} = \xxsubtract{\Dotix{\Veim{eim}}}{\Dotix{\Veim{bas}}}
\]
then
all of the \myfnname{null-scan-op} operations are
well-defined in
\begin{equation}
\label{eq:eim-lasting-base-27}
\myfnname{null-scan-op}^{\displaystyle (\var{i})}(\Veim{bas}) = \Veim{eim}.
\end{equation}

From
Theorem
\ref{t:null-scan-from-down-cause},
the assumption for that theorem that $\Valid{\Veim{eim}}$,
and the definition of \myfnname{null-scan-op},
we know that, if $\Postdot{\Veim{down}} = \epsilon$,
then
\begin{equation}
\label{eq:eim-lasting-base-30}
\op{null-scan-op}{\Veim{down}} = \Veim{eim} \implies
\Valid{\Veim{down}}.
\end{equation}
Using
\eqref{eq:eim-lasting-base-23}
and
\eqref{eq:eim-lasting-base-30},
we see that in
\eqref{eq:eim-lasting-base-27},
\Veim{bas} is valid.
\eqref{eq:eim-lasting-base-27}
shows directly that \Veim{eim} is in the fleeting closure
of \Veim{bas}.

It remains to show that \Veim{bas} is unique.
\eqref{eq:eim-lasting-base-25}
and
\eqref{eq:eim-lasting-base-27}
show that for any lasting base,
call it \Veim{bas},
\Veim{eim} must be in its fleeting closure,
so that
\begin{equation}
\el{fc}{0} = \Veim{bas} \; \land \;
\exists \var{a} : \Vel{fc}{a} = \Veim{eim},
\end{equation}
where \var{fc} is the fleeting closure of \Veim{bas}.

Assume for a reductio,
that \Veim{bas1} and \Veim{bas2}
are
two different lasting bases
of \Veim{eim}.
Let the fleeting closure of \Veim{bas1} be \var{fc1}
and let the fleeting closure of \Veim{bas2} be \var{fc2}.
Using Theorem \ref{t:null-scan-arithmetic},
we have, for some \var{ix1}, \var{ix2},
\begin{multline}
\label{t:eim-lasting-base-40}
 \Veim{eim} = \Vel{fc1}{ix1} =
\\
\left[
\begin{gathered}
  [
\Rule{\Veim{bas1}}, (\Dotix{\Veim{bas1}} + \var{ix1}) ], \\
  \Left{\Veim{bas1}},
  \Current{\Veim{bas1}},
\end{gathered}
\right]
\end{multline}
and
\begin{multline}
\label{t:eim-lasting-base-42}
 \Veim{eim} = \Vel{fc2}{ix2} =
\\
\left[
\begin{gathered}
  [
\Rule{\Veim{bas2}}, (\Dotix{\Veim{bas2}} + \var{ix2}) ], \\
  \Left{\Veim{bas2}},
  \Current{\Veim{bas2}},
\end{gathered}
\right]
\end{multline}

By assumption for the reductio,
\begin{equation}
\label{eq:eim-lasting-base-48}
\Veim{bas1} \neq \Veim{bas2}.
\end{equation}
From
\eqref{t:eim-lasting-base-40}
and
\eqref{t:eim-lasting-base-42},
we know that
\begin{equation}
\label{eq:eim-lasting-base-49}
\begin{gathered}
\Rule{\Veim{eim}}  = \Rule{\Veim{bas1}} \; \land \\
\Left{\Veim{eim}}  = \Left{\Veim{bas1}} \; \land \\
\Current{\Veim{eim}}  = \Current{\Veim{bas1}} \; \land \\
\Rule{\Veim{eim}}  = \Rule{\Veim{bas2}} \; \land \\
\Left{\Veim{eim}}  = \Left{\Veim{bas2}} \; \land \\
\Current{\Veim{eim}}  = \Current{\Veim{bas2}},
\end{gathered}
\end{equation}
so that
\begin{equation}
\label{eq:eim-lasting-base-50}
\begin{gathered}
\Rule{\Veim{bas1}}  = \Rule{\Veim{bas2}} \; \land \\
\Left{\Veim{bas1}}  = \Left{\Veim{bas2}} \; \land \\
\Current{\Veim{bas1}}  = \Current{\Veim{bas2}}.
\end{gathered}
\end{equation}
From
\eqref{eq:eim-lasting-base-50}
we see that we have
\eqref{eq:eim-lasting-base-48}
only if
\[
 \Dotix{\Veim{bas1}} \neq \Dotix{\Veim{bas2}}.
\]
Without loss of generality,
we assume that
\begin{equation}
\label{eq:eim-lasting-base-52}
 \Dotix{\Veim{bas1}} < \Dotix{\Veim{bas2}}.
\end{equation}

From
\eqref{t:eim-lasting-base-40}
and
\eqref{t:eim-lasting-base-42},
\begin{gather}
\notag
\Dotix{\Veim{eim}} = \Dotix{\Veim{bas2}} + \var{ix2} \\
\label{eq:eim-lasting-base-54}
\therefore \; \Dotix{\Veim{bas2}} < \Dotix{\Veim{eim}}
\end{gather}

By the definition of a lasting base for an EIM,
\begin{equation}
\label{eq:eim-lasting-base-55}
\begin{aligned}
& \forall \; \var{a} : \Dotix{\Veim{bas1}} \le \var{a} < \Dotix{\Veim{eim}} \\
& \qquad \implies \RHS{\Veim{bas1}, \var{a}} = \epsilon
\end{aligned}
\end{equation}

From
\eqref{eq:eim-lasting-base-49}
we have
\begin{equation}
\label{eq:eim-lasting-base-57}
\Rule{\Veim{eim}} = \Rule{\Veim{bas1}} = \Rule{\Veim{bas2}}
\end{equation}
From
\eqref{eq:eim-lasting-base-52},
\eqref{eq:eim-lasting-base-54},
\eqref{eq:eim-lasting-base-55}
and
\eqref{eq:eim-lasting-base-57},
we see that
\[
    \Predot{\Veim{bas2}} = \epsilon.
\]
But by assumption for the reductio, \Veim{bas2} was
a lasting base, and by the definition of a lasting base,
a lasting base cannot have a nulling predot symbol.
This contradiction shows the reductio,
and we see that $\Veim{bas1} = \Veim{bas2}$.
Since the choice of \Veim{bas1} and \Veim{bas2} was
without loss of generality,
we see that no EIM has more than one distinct lasting base.
\end{proof}

\begin{theorem}
\ttitle{Partial fleeting closure validity}
\label{t:partial-fleeting-closure-validity}
Let \Veim{eim} be a valid EIM,
and let \var{ns} be its fleeting closure.
Then
every
EIM in \var{ns} is
valid;
for all \var{a}
such that
$0 \le \var{a} \le \decr{\Vlastix{ns}}$,
\Vel{ns}{a} is the unique top-down cause of
\el{ns}{\Vincr{a}}; and
\el{ns}{\Vincr{a}}
is the unique effect of \Vel{ns}{a}.
\end{theorem}

\begin{proof}
A fleeting closure, by its definition,
is zero or more iterations
of the \myfnname{null-scan-op} operation.
For zero operations, the theorem follows
trivially.
For a single operation,
the theorem follows from Theorem
\ref{t:null-scan-from-down-cause}.
The general case can be shown by induction
on the number of
\myfnname{null-scan-op} operations
in the fleeting closure.
\end{proof}

\begin{definition}
\dtitle{Maximal fleeting closure}
The
\dfn{maximal fleeting closure}
of an EIM is the fleeting closure
of its lasting base.
\end{definition}

\begin{theorem}
\ttitle{Maximal fleeting closure validity}
\label{t:maximal-fleeting-closure-validity}
Let \Veim{eim} be a valid EIM.
Then
\begin{gather}
\label{t:maximal-fleeting-closure-validity-10}
\myparbox{\Veim{eim}
has exactly one
maximal fleeting closure,
call it \var{bns};
} \\
\label{t:maximal-fleeting-closure-validity-13}
\myparbox{every
EIM in \var{bns} is
valid;
} \\
\label{t:maximal-fleeting-closure-validity-16}
\myparbox{
for all \var{a}
such that
$0 \le \var{a} \le \decr{\Vlastix{bns}}$,
\Vel{bns}{a} is the unique top-down cause of
\el{bns}{\Vincr{a}}; and
} \\
\label{t:maximal-fleeting-closure-validity-19}
\myparbox{
for all \var{a}
such that
$0 \le \var{a} \le \decr{\Vlastix{bns}}$,
\el{bns}{\Vincr{a}}
is the unique effect of \Vel{bns}{a}.
}
\end{gather}
\end{theorem}

\begin{proof}
Theorems
\ref{t:eim-lasting-base}
and
\ref{t:partial-fleeting-closure-validity}
show
\eqref{t:maximal-fleeting-closure-validity-13},
\eqref{t:maximal-fleeting-closure-validity-16},
\eqref{t:maximal-fleeting-closure-validity-19}
and
that \Veim{eim} has at least one maximal
fleeting closure.

To prove
\eqref{t:maximal-fleeting-closure-validity-10}
and the theorem,
it remains to show that \Veim{eim}
has at most one distinct maximal fleeting closure.
To do this,
we will assume
that \var{mfc1} and \var{mfc2}
are two maximal fleeting closures
such that
\[
\Veim{eim} \in \var{mfc1}
\; \land \;
\Veim{eim} \in \var{mfc2}
\]
to show that
\begin{equation}
\forall \; \var{a} : \Vel{mfc1}{a} = \Vel{mfc2}{a}.
\end{equation}

We proceed by induction,
where
\begin{equation}
\label{t:maximal-fleeting-closure-validity-30}
\tag{IND}
\Vel{mfc1}{x} = \Vel{mfc2}{x}
\end{equation}
is the induction hypothesis.
Here \var{mfc1} and \var{mfc2} can be (and in fact always are)
partial functions.
Recall that we write $\Vel{fc}{x} = \undefined$ to
say that ``\var{fc} is undefined at \var{x}''.
Also recall that,
for all \var{x}, \var{y},
if $\var{x} = \undefined$,
then $\var{x} \, = \, \var{y} \; \equiv \; \var{y} \, = \, \undefined$.


By the definition of a maximal fleeting closure, its first
element is a lasting base of \Veim{eim}.
By Theorem
\ref{t:eim-lasting-base},
\Veim{eim} has at most one distinct lasting base,
which shows that
\[
\el{mfc1}{0} = \el{mfc2}{0},
\]
which is
\eqref{t:maximal-fleeting-closure-validity-30}
for $\var{x} = 0$.
We take this as the basis of our induction.

For the step of the induction, we
assume
\eqref{t:maximal-fleeting-closure-validity-30}
for $\var{x} = \var{i}$,
to show
\eqref{t:maximal-fleeting-closure-validity-30}
for $\var{x} = \Vincr{i}$.
Within the step we proceed by cases,
based on the value of \Vel{mfc1}{i}.
In what follows, we will use the fact that
a fleeting closure is defined in terms of
\myfnname{null-scan-op},
so that
\begin{align}
\label{t:maximal-fleeting-closure-validity-36}
& \el{mfc1}{\Vincr{i}} = \op{null-scan-op}{\Vel{mfc1}{i}} &&
\\
\label{t:maximal-fleeting-closure-validity-38}
& \el{mfc2}{\Vincr{i}} = \op{null-scan-op}{\Vel{mfc2}{i}} &&
\end{align}

In the first case
\Vel{mfc1}{i} is defined,
and
$\Postdot{\Vel{mfc1}{i}} \neq \epsilon$.
\begin{align}
\label{t:maximal-fleeting-closure-validity-44}
& \Vel{mfc1}{i} \neq \undefined && \text{case ASM}
\\
\label{t:maximal-fleeting-closure-validity-46}
& \Postdot{\Vel{mfc1}{i}} \neq \epsilon && \text{case ASM}
\\
\label{t:maximal-fleeting-closure-validity-48}
& \Vel{mfc2}{i} \neq \undefined &&
\eqref{t:maximal-fleeting-closure-validity-44},
\text{step ASM}
\\
\label{t:maximal-fleeting-closure-validity-50}
& \Postdot{\Vel{mfc2}{i}} \neq \epsilon &&
\eqref{t:maximal-fleeting-closure-validity-46},
\text{step ASM}
\end{align}
Recalling that \myfnname{null-scan-op} is a null-scan,
so that \op{null-scan-op}{\Veim{x}} is only defined if the postdot symbol of \Veim{x}
is nulling,
\begin{align}
\label{t:maximal-fleeting-closure-validity-54}
& \op{null-scan-op}{\Vel{mfc1}{i}} = \undefined &&
\eqref{t:maximal-fleeting-closure-validity-46}
\\
\label{t:maximal-fleeting-closure-validity-56}
& \op{null-scan-op}{\Vel{mfc2}{i}} = \undefined &&
\eqref{t:maximal-fleeting-closure-validity-50}.
\end{align}
\begin{align}
\label{t:maximal-fleeting-closure-validity-64}
& \el{mfc1}{\Vincr{i}} = \undefined &&
\eqref{t:maximal-fleeting-closure-validity-36},
\eqref{t:maximal-fleeting-closure-validity-54}
\\
\label{t:maximal-fleeting-closure-validity-66}
& \el{mfc2}{\Vincr{i}} = \undefined &&
\eqref{t:maximal-fleeting-closure-validity-38},
\eqref{t:maximal-fleeting-closure-validity-56}
\\
\label{t:maximal-fleeting-closure-validity-70}
& \el{mfc1}{\Vincr{i}} = \el{mfc2}{\Vincr{i}}
&&
\eqref{t:maximal-fleeting-closure-validity-64},
\eqref{t:maximal-fleeting-closure-validity-66}
\end{align}
\eqref{t:maximal-fleeting-closure-validity-70}
shows the step for the first case.

In the second case
\Vel{mfc1}{i} is defined,
and
$\Postdot{\Vel{mfc1}{i}} = \epsilon$.
\begin{align}
\label{t:maximal-fleeting-closure-validity-74}
& \Vel{mfc1}{i} \neq \undefined && \text{case ASM}
\\
\label{t:maximal-fleeting-closure-validity-76}
& \Postdot{\Vel{mfc1}{i}} = \epsilon && \text{case ASM}
\\
\label{t:maximal-fleeting-closure-validity-78}
& \Vel{mfc2}{i} \neq \undefined &&
\eqref{t:maximal-fleeting-closure-validity-74},
\text{step ASM}
\\
\label{t:maximal-fleeting-closure-validity-80}
& \Postdot{\Vel{mfc2}{i}} = \epsilon &&
\eqref{t:maximal-fleeting-closure-validity-76},
\text{step ASM}
\\
\label{t:maximal-fleeting-closure-validity-82}
& \Vel{mfc1}{i} = \Vel{mfc2}{i} &&
\text{step ASM}
\end{align}
In Theorem
\ref{t:null-scan-from-down-cause},
we showed that \myfnname{null-scan-op} is a function,
so that from
\eqref{t:maximal-fleeting-closure-validity-36},
\eqref{t:maximal-fleeting-closure-validity-38}
and
\eqref{t:maximal-fleeting-closure-validity-82}
we have
\[
\el{mfc1}{\Vincr{i}} = \el{mfc2}{\Vincr{i}},
\]
which shows the step for the second case.

In the third case,
\Vel{mfc1}{i} is undefined.
By assumption for the step,
this means that
\Vel{mfc2}{i} is also undefined,
so that
\begin{equation}
\label{t:maximal-fleeting-closure-validity-90}
\begin{gathered}
  \el{mfc1}{\Vincr{i}} = \op{null-scan-op}{\Vel{mfc1}{i}} \\
  = \el{mfc2}{\Vincr{i}} = \op{null-scan-op}{\Vel{mfc2}{i}} = \undefined.
\end{gathered}
\end{equation}
\eqref{t:maximal-fleeting-closure-validity-90}
shows the step for the third case.

We have now shown the step of the induction for all three cases.
This gives us the induction,
\eqref{t:maximal-fleeting-closure-validity-10},
and the theorem.
\end{proof}

\begin{theorem}
\ttitle{Fleeting closure maximization}
\label{t:fleeting-closure-maximization}
If two EIM's are in the same fleeting closure,
then they are also in the same maximal fleeting closure.
\end{theorem}

\begin{proof}
Let \Veim{eim1} and \Veim{eim2} be two EIM's
in the same fleeting closure.
Without loss of generality, we assume that
\begin{equation}
\label{eq:fleeting-closure-maximization-10}
\Veim{eim2} = \iop{null-scan-op}{\var{y}}{\Veim{eim1}}
\end{equation}
By Theorem
\ref{t:maximal-fleeting-closure-validity}
an EIM is in
exactly one maximal fleeting closure,
so that
\begin{gather}
\notag
\Veim{eim1} = \iop{null-scan-op}{\var{x}}{\Veim{bas1}} \\
\label{eq:fleeting-closure-maximization-16}
\text{and} \quad
\Veim{eim2} = \iop{null-scan-op}{\var{z}}{\Veim{bas2}}
\end{gather}
where \Veim{bas1} and \Veim{bas2} are lasting bases.
Since \myfnname{null-scan-op} is a function with an inverse,
we know that
\begin{gather}
\notag
\Veim{eim2} = \iop{null-scan-op}{\var{y}}{
 \iop{null-scan-op}{\var{x}}{\Veim{bas1}}
} \\
\label{eq:fleeting-closure-maximization-19}
\therefore \quad
\Veim{eim2} = \iop{null-scan-op}{(\var{x}+\var{y})}{\Veim{bas1}}
\end{gather}
Since \Veim{bas1} is the lasting base of \Veim{eim1},
\Veim{bas1} is a lasting base,
so that by
\eqref{eq:fleeting-closure-maximization-19}
and the definition of the lasting base of an EIM,
\Veim{bas1} is the lasting base of \Veim{eim2}.
Since an EIM has at most one lasting base,
we can conclude from
\eqref{eq:fleeting-closure-maximization-16}
and
\eqref{eq:fleeting-closure-maximization-19}
that $\var{x}+\var{y}=\var{z}$ and that
\begin{equation}
\label{eq:fleeting-closure-maximization-22}
\Veim{bas1} = \Veim{bas2}.
\end{equation}

From
\eqref{eq:fleeting-closure-maximization-22}
we see that \Veim{bas1} is the lasting base of both
\Veim{eim1} and \Veim{eim2}.
From Theorem
\ref{t:maximal-fleeting-closure-validity},
we know that \Veim{bas1} has exactly one maximal fleeting closure;
call it \var{mfc}.
By Theorem
\ref{t:eim-lasting-base},
every EIM is in the fleeting closure of its lasting base,
so that
\Veim{eim1} and \Veim{eim2}
are both in \var{mfc}.
\end{proof}

\begin{theorem}
\ttitle{Quasi-complete fleeting closure properties}
\label{t:quasi-complete-fleeting-closure-properties}
Let
\begin{equation}
\label{eq:quasi-complete-fleeting-closure-properties-5}
\Veim{down} = \big[ [ \Vrule{r}, \var{lo} ], \var{i}, \var{k} \big],
\end{equation}
be a valid quasi-complete EIM,
and let \Veim{bas} be its lasting base.
If the series \var{ns} is the fleeting closure of
either \Veim{bas} or \Veim{down},
then we have all of the following:
\begin{align}
\label{eq:quasi-complete-fleeting-closure-properties-9}
& \text{\var{ns} contains at most \Vsize{\Vrule{r}}
  elements
}
\\
\label{eq:quasi-complete-fleeting-closure-properties-10}
& \text{$\var{ns}\big[ \Vlastix{ns} \big]$
  is a complete EIM
}
\\
\label{eq:quasi-complete-fleeting-closure-properties-12}
& \begin{aligned}
& \forall \var{a} : 0 \le \var{a} < \Vlastix{ns} \\
& \quad \implies \text{\Vel{ns}{a} is an incomplete EIM}
\end{aligned}
\\
\label{eq:quasi-complete-fleeting-closure-properties-13}
& \begin{aligned}
& \forall \var{a} : 0 \le \var{a} \le \Vlastix{ns} \\
& \quad \implies \text{\Vel{ns}{a} is a quasi-complete EIM}
\end{aligned}
\\
\label{eq:quasi-complete-fleeting-closure-properties-14}
& \begin{aligned}
& \forall \var{a} : 0 \le \var{a} \le \Vlastix{ns}
  \implies \Valid{\Vel{ns}{a}}
\end{aligned}
\\
\label{eq:quasi-complete-fleeting-closure-properties-16}
& \begin{aligned}
& \forall \var{a} : 0 \le \var{a} \le \Vlastix{ns} \\
& \qquad \implies \Right{\el{ns}{0}} = \Right{\Vel{ns}{a}}
\end{aligned}
\\
\label{eq:quasi-complete-fleeting-closure-properties-18}
& \begin{aligned}
& \forall \var{a} : 0 \le \var{a} \le \Vlastix{ns} \\
& \qquad \implies \op{Rule}{\el{ns}{0}} = \op{Rule}{\Vel{ns}{a}}
\end{aligned}
\\
\label{eq:quasi-complete-fleeting-closure-properties-20}
& \begin{aligned}
& \forall \var{a} : 0 \le \var{a} \le \decr{\Vlastix{ns}} \\
& \qquad \implies \text{\Vel{ns}{a} is the
  unique top-down cause of
  \el{ns}{\Vincr{a}}
}
\end{aligned}
\\
\label{eq:quasi-complete-fleeting-closure-properties-22}
& \begin{aligned}
& \forall \var{a} : 0 \le \var{a} \le \decr{\Vlastix{ns}} \\
& \qquad \implies \text{\el{ns}{\Vincr{a}}
  is the unique effect of \Vel{ns}{a}
}
\end{aligned}
\end{align}
\end{theorem}

\begin{proof}
We first consider \Veim{bas}.
By assumption for the theorem,
\Veim{bas} is the lasting base of \Veim{down}.
By Theorem \ref{t:eim-lasting-base}, \Veim{down}
has a valid lasting base:
\begin{equation}
\label{eq:quasi-complete-fleeting-closure-properties-24a}
\Valid{\Veim{bas}}.
\end{equation}
By assumption for the theorem, \Veim{down}
is quasi-complete,
so that, by the definition
of quasi-complete, all the symbols
in the dot suffix of \Veim{down}
are nulling.
By the definition of a lasting base,
all of the symbols between
\Dotix{\Veim{bas}}
and
\Dotix{\Veim{down}}
are nulling.
Therefore all of the symbols in the dot
suffix of \Veim{bas} are nulling,
so that, by the definition of quasi-complete,
\begin{equation}
\label{eq:quasi-complete-fleeting-closure-properties-24b}
\text{\Veim{bas} is quasi-complete.}
\end{equation}

We will next show the requirements of the theorem
for \Veim{quasi},
an EIM which is valid and quasi-complete,
and which otherwise is chosen without
loss of generality.
Let
\var{ns1} be the fleeting closure of \Veim{quasi}.
We have,
using
Theorem
\ref{t:partial-fleeting-closure-validity},
Requirements
\eqref{eq:quasi-complete-fleeting-closure-properties-14},
\eqref{eq:quasi-complete-fleeting-closure-properties-20}
and
\eqref{eq:quasi-complete-fleeting-closure-properties-22}
for the theorem.

Because \Veim{quasi}
is a quasi-complete EIM,
we know that
\begin{multline}
\label{eq:quasi-complete-fleeting-closure-properties-28}
\el{ns1}{0} = \Veim{quasi} \\
\text{and} \quad
  \forall \; \var{a} : 0 \le \var{a} < (\xxsubtract{\Vsize{\Vrule{r}}}{\var{lo}})
\\
\implies
\el{ns1}{\Vincr{a}} =
\big[ [ \Vrule{r}, \var{lo}+\var{a}+1 ], \var{i}, \var{k} \big].
\end{multline}
and
\begin{equation}
\label{eq:quasi-complete-fleeting-closure-properties-30}
\forall \; \var{a} : 0 \le \var{a} < (\xxsubtract{\Vsize{\Vrule{r}}}{\var{lo}})
  \implies \Vop{RHS}{\Vrule{r}, \var{lo}+\var{a}} = \epsilon
\end{equation}

From
\eqref{eq:quasi-complete-fleeting-closure-properties-28},
we can see that
\begin{gather*}
\Vlastix{ns1} = \xxsubtract{\Vsize{\Vrule{r}}}{\var{lo}}, \quad
\text{so that}  \\
\begin{aligned}
\op{Dotix}{\var{ns1}\big[\Vlastix{ns1}\big]}
& = \var{lo} + (\decr{( \xxsubtract{\Vsize{\Vrule{r}}}{\var{lo}}) }) + 1 \\
& = \Vsize{\Vrule{r}}
\end{aligned}
\end{gather*}
which shows
\eqref{eq:quasi-complete-fleeting-closure-properties-10}.
Similarly,
we see
from
\eqref{eq:quasi-complete-fleeting-closure-properties-28},
\begin{equation*}
\begin{aligned}
&& \var{ix} & < \Vlastix{ns1} \\
\implies && \op{Dotix}{\Vel{ns1}{ix}}
& < \var{lo} + (\decr{( \xxsubtract{\Vsize{\Vrule{r}}}{\var{lo}}) }) + 1 \\
\implies && \op{Dotix}{\Vel{ns1}{ix}}
& < \Vsize{\Vrule{r}}
\end{aligned}
\end{equation*}
which shows
\eqref{eq:quasi-complete-fleeting-closure-properties-12}.

We see from
\eqref{eq:quasi-complete-fleeting-closure-properties-28}
that every element of \var{ns1}
is an EIM which differs from
the other elements of \var{ns1}
only in its dot index,
which gives us
\eqref{eq:quasi-complete-fleeting-closure-properties-16}
and
\eqref{eq:quasi-complete-fleeting-closure-properties-18}.
From
\eqref{eq:quasi-complete-fleeting-closure-properties-28},
we also see that
\begin{equation}
\var{ix} > 0 \implies \Dotix{\Vel{ns1}{ix}} > \Dotix{\el{ns1}{0}}
\end{equation}
so that using
\eqref{eq:quasi-complete-fleeting-closure-properties-30},
\begin{equation}
\label{eq:quasi-complete-fleeting-closure-properties-40}
\begin{gathered}
\forall \; \var{nsix}, \var{rhix} :
0 \le \var{nsix} \le \Vlastix{ns1} \\
\land \;
\Dotix{\Vel{ns1}{nsix}} \le \var{rhix} \le \Vsize{\Vrule{r}} \\
\implies
\Vop{RHS}{\Vrule{r}, \var{rhix}} = \epsilon
\end{gathered}
\end{equation}
and since every layer of \var{ns1} shares the same rule,
\eqref{eq:quasi-complete-fleeting-closure-properties-40}
shows
\eqref{eq:quasi-complete-fleeting-closure-properties-13}.

As we already noted, the layers of \var{ns1} differ
\textbf{only} in their dot index.
There are at most
\incr{\Vsize{\Vrule{r}}} distinct dot indexes.
By
\eqref{eq:quasi-complete-fleeting-closure-properties-13},
every layer is quasi-complete,
so that,
by Theorem \ref{t:quasi-drs-disjoint},
no layer is a prediction.
Therefore no layer of \var{ns1} uses dot index 0.
So there are at most
\Vsize{\Vrule{r}} layers in \var{ns1},
which shows
\eqref{eq:quasi-complete-fleeting-closure-properties-9}.
With this, we have shown the last of the requirements
for the theorem for \Veim{quasi}.

We have shown the requirements for the theorem for \Veim{quasi},
a valid quasi-complete EIM.
By assumption for the theorem, \Veim{down} is a valid quasi-complete
EIM,
and therefore we have shown the requirements
for the theorem for \Veim{down}.
From
\eqref{eq:quasi-complete-fleeting-closure-properties-24a}
and
\eqref{eq:quasi-complete-fleeting-closure-properties-24b},
we know that \Veim{bas} is a valid quasi-complete EIM,
and therefore we have shown the requirements
for the theorem for \Veim{bas} as well.
\end{proof}

\section{Ambiguity}

\begin{theorem}
\ttitle{Multiple top-down causes make a grammar ambiguous}
\label{t:multi-down-cause-ambiguous}
If any confirmed Earley item has more than one top-down cause,
the grammar is ambiguous.
\end{theorem}

\begin{proof}
Assume for a reductio, that the confirmed EIM \Veim{effect} has more than one top-down cause,
but that \Cg{} is not ambiguous.
Without loss of generality,
let \Veim{effect} be
\begin{equation}
\label{eq:multi-down-cause-ambiguous-20}
\Veim{effect} =
[ [ \Vsym{down} \de \Vstr{pre} \cat \Vsym{A} \mydot \Vstr{post} ], \var{i}, \var{k} ].
\end{equation}
Since \Veim{effect} is confirmed,
the dotted rule and origin of its top-down cause are determined by \Veim{effect}
\dref[causes of confirmed EIM]{def:causes-confirmed}.
Therefore, if \Veim{effect} has two distinct
top-down causes, they can differ only in their current position.
Let the two distinct top-down causes be
\begin{gather*}
\Veim{down1} = [ [ \Vsym{down} \derives \Vstr{pre} \mydot \Vsym{A} \cat \Vstr{post} ], \var{i}, \var{j1} ] \\
\Veim{down2} = [ [ \Vsym{down} \derives \Vstr{pre} \mydot \Vsym{A} \cat \Vstr{post} ], \var{i}, \var{j2} ]
\end{gather*}
From these we get the two derivations:
\begin{gather*}
\Vsym{down} \derives \Vmk{i} \Vstr{pre} \Vmk{j1} \Vsym{A} \Vstr{post} \\
\Vsym{down} \derives \Vmk{i} \Vstr{pre} \Vmk{j2} \Vsym{A} \Vstr{post}
\end{gather*}
These will be different factorings of the input if $\var{j1} \neq \var{j2}$.
By assumption for the reductio, \Cg{} is not ambiguous,
and therefore no derivation step can allow two different factorings of the input.
So $\var{j1} = \var{j2}$.
But then $\Veim{down1} = \Veim{down2}$, which is contrary to assumption
for the reductio.
\end{proof}

\begin{theorem}
\ttitle{Multiple bottom-up causes make a grammar ambiguous}
\label{t:multi-up-cause-ambiguous}
If any confirmed Earley item has more than one bottom-up cause,
the grammar is ambiguous.
\end{theorem}

\begin{proof}
Assume for a reductio that
the confirmed \Veim{effect} has more than one bottom-up cause
but that \Cg{} is not ambiguous.
Without loss of generality,
let \Veim{effect} be
\begin{equation}
\label{eq:multi-up-cause-ambiguous-10}
\Veim{effect} =
\big[ [ \Vsym{down} \de \Vstr{pre} \cat \Vsym{A} \mydot \Vstr{post} ], \var{i}, \var{k}
\big]
\end{equation}
and call the two differing bottom-up causes, \Vinst{up1}
and \Vinst{up2}.
\Veim{effect} is confirmed by assumption for the theorem,
so that by
\dref[causes of confirmed EIM]{def:causes-confirmed},
\begin{gather}
\label{eq:multi-up-cause-ambiguous-15}
\Right{\var{up1}} = \Right{\var{up2}} \; \text{and} \\
\label{eq:multi-up-cause-ambiguous-16}
\Symbol{\var{up1}} = \Symbol{\var{up2}}.
\end{gather}
Therefore
\Vinst{up1} and \Vinst{up2}
can differ only in their left location, or in their EIM equivalent.

We now consider whether 
\Vinst{up1} and \Vinst{up2}
can differ in their left location:
\begin{align}
\label{eq:multi-up-cause-ambiguous-20}
& \myparbox{ %
\Veim{effect} is a confirmed EIM
\becuz{}
ASM for reductio.
} \\
\label{eq:multi-up-cause-ambiguous-22}
& \myparbox{ %
The bottom-up causes of \Veim{effect} have matching down causes
\becuz{}
\eqref{eq:multi-up-cause-ambiguous-20},
\tref{t:symbolic-causes-from-effect}.
} \\
\label{eq:multi-up-cause-ambiguous-24}
& \myparbox{ %
If two bottom-up causes differ in their left location,
their matching down causes will differ in their right location
\becuz{}
\dref[matching causes]{def:matching-causes}.
} \\
\label{eq:multi-up-cause-ambiguous-26}
& \myparbox{ %
If \Veim{effect} has two different top-down causes,
\Cg{} is ambiguous
\becuz{}
\eqref{eq:multi-up-cause-ambiguous-20},
\tref{t:multi-down-cause-ambiguous}.
} \\
\label{eq:multi-up-cause-ambiguous-28}
& \myparbox{ %
\Cg{} is not ambiguous by assumption for the reductio.
} \\
\label{eq:multi-up-cause-ambiguous-30}
& \myparbox{ %
$\Left{\var{up1}} = \Left{\var{up2}}$
\becuz{}
\eqref{eq:multi-up-cause-ambiguous-24},
\eqref{eq:multi-up-cause-ambiguous-26},
\eqref{eq:multi-up-cause-ambiguous-28}.
}
\end{align}

Since
$\Symbol{\var{up1}} = \Symbol{\var{up2}}$,
and every symbol is either a terminal or a non-terminal,
two bottom-up causes cannot differ in whether they have an EIM equivalent.
Theorem
\ref{t:eim-equivalent-from-non-terminal}
shows that a parse instance has an EIM equivalent
if and only if its symbol is a non-terminal,
so we know that
if \var{up1} has no EIM equivalent,
then \var{up2} has no EIM equivalent.
But if both
\var{up1} and
\var{up2} have no EIM equivalent,
they consist entirely of their parse symbol instance,
so that by
\eqref{eq:multi-up-cause-ambiguous-15},
\eqref{eq:multi-up-cause-ambiguous-16}
and
\eqref{eq:multi-up-cause-ambiguous-30},
they are identical.

It remains to examine the case where bottom-up causes differ in their EIM equivalent.
By
\eqref{eq:multi-up-cause-ambiguous-15}
and \eqref{eq:multi-up-cause-ambiguous-16}
the symbol and right location of the two bottom-up causes must be the same
\dref[causes of confirmed EIM]{def:causes-confirmed}.
The left locations of \Veim{up1} and \Veim{up2} must be identical
\eqref{eq:multi-up-cause-ambiguous-30}.
So the two bottom-up causes can differ only in the RHS of their dotted rule.
An EIM bottom-up cause of \Veim{effect}
must be a complete EIM \becuz{}
\eqref{eq:multi-up-cause-ambiguous-20}.
Therefore
without loss of generality,
let the two differing bottom-up causes be
\begin{gather*}
\Veim{up1} = \big[ [ \Vsym{up} \derives \Vstr{up-rhs1} \mydot ], \var{j}, \var{k}
\big] \\
\Veim{up2} = \big[ [ \Vsym{up} \derives \Vstr{up-rhs2} \mydot ], \var{j}, \var{k}
\big].
\end{gather*}

From these we get the two derivations:
\begin{gather*}
\Vsym{up} \derives \Vmk{j} \Vstr{up-rhs1} \Vmk{k} \\
\Vsym{up} \derives \Vmk{j} \Vstr{up-rhs2} \Vmk{k}
\end{gather*}
These will be different derivations of the input if
$\Vstr{up-rhs1} \neq \Vstr{up-rhs2}.$
By assumption for the reductio, \Cg{} is not ambiguous,
and therefore no derivation step can allow two different sentential forms.
So $\Vstr{up-rhs1} = \Vstr{up-rhs2}.$
But then $\Veim{up1} = \Veim{up2}$, which is contrary to assumption
for the reductio.\qedhere
\end{proof}

\chapter{Tethers}
\label{ch:tethers}

\begin{theorem}
\ttitle{Right location of top-down cause}
\label{t:right-location-of-top-down-cause}
Let \Veim{effect} be a valid EIM other than
the start EIM.
Then it has a top-down cause,
that cause is an EIM, call it \Veim{down},
and
\begin{align}
\label{req:right-location-of-top-down-cause-3}
& \rlap{$\Right{\Veim{down}} = \Right{\Veim{effect}}$} & \\
& \qquad \qquad \text{if \Veim{effect} is a prediction,} & \notag \\
\label{req:right-location-of-top-down-cause-4}
& \rlap{$\Right{\Veim{down}} = \Right{\Veim{effect}}$} & \\
& \qquad \qquad \text{if \Veim{effect} is a null-scan,} & \notag\\
\label{req:right-location-of-top-down-cause-6}
& \rlap{$\Right{\Veim{down}} = \decr{\Right{\Veim{effect}}}$} & \\
& \qquad \qquad \text{if \Veim{effect} is a read,} & \notag\\
\label{req:right-location-of-top-down-cause-9}
& \rlap{$\Right{\Veim{down}} < \Right{\Veim{effect}}$} & \\
& \qquad \qquad \text{if \Veim{effect} is a reduction.} & \notag
\end{align}
\end{theorem}

\begin{proof}
If \Veim{effect} is a prediction,
this theorem follows from
Theorem \ref{t:prediction-from-cause}.
This shows Requirement~\ref{req:right-location-of-top-down-cause-3}.

For the remaining cases,
we will
use Theorem \ref{t:symbolic-causes-from-effect}
to show that \Veim{down} is the matching
cause of a symbolic instance.
Call that instance, \Vinst{up},
and let its length be
\begin{equation}
\label{eq:right-location-of-top-down-cause-12}
\Vsize{\Vinst{up}} =
(\Right{\Vinst{up}} \subtract \Left{\Vinst{up}}).
\end{equation}
From Theorem \ref{t:symbolic-causes-from-effect},
we know that
\begin{equation}
\label{eq:right-location-of-top-down-cause-15}
\Right{\Vinst{up}} = \Right{\Veim{effect}}
\end{equation}
From the definition of matching causes,
\begin{equation}
\label{eq:right-location-of-top-down-cause-18}
\Right{\Veim{down}} = \Left{\Vinst{up}}.
\end{equation}
Using
\eqref{eq:right-location-of-top-down-cause-12},
\eqref{eq:right-location-of-top-down-cause-15}
and
\eqref{eq:right-location-of-top-down-cause-18}
we see that
\begin{equation}
\label{eq:right-location-of-top-down-cause-21}
\Right{\Veim{effect}} = \Right{\Veim{down}} + \Vsize{\Vinst{up}}.
\end{equation}

If \Veim{effect} is a null scan, \Vinst{up} is
a nulling symbol instance,
$\Vsize{\Vinst{up}} = 0$.
Using
\eqref{eq:right-location-of-top-down-cause-21},
we have
\[
  \Right{\Veim{down}} = \Right{\Veim{effect}},
\]
which is Requirement~\ref{req:right-location-of-top-down-cause-4}.

If \Veim{effect} is a read, \Vinst{up} is
a terminal symbol instance,
$\Vsize{\Vinst{up}} = 1$.
Using
\eqref{eq:right-location-of-top-down-cause-21},
we have
\[
  \Right{\Veim{down}} = \Right{\Veim{effect}} \subtract 1,
\]
which is Requirement~\ref{req:right-location-of-top-down-cause-6}.

If \Veim{effect} is a reduction, \Vinst{up} is
a non-terminal symbol instance,
$\Vsize{\Vinst{up}} \ge 1$.
Using
\eqref{eq:right-location-of-top-down-cause-21},
we have
\[
  \Right{\Veim{down}} < \Right{\Veim{effect}},
\]
which is Requirement~\ref{req:right-location-of-top-down-cause-9}.

\end{proof}

\begin{definition}
\label{def:tether}
\dtitle{Tether}
Let \Veim{eim} be an Earley item.
The sequence
\begin{equation}
\el{teth}{0},
\el{teth}{1},
\ldots,
\Vel{teth}{top}, \quad \text{where $\var{top} \ge 1$}
\end{equation}
is a
\dfn{tether}
of \Veim{eim} if and only if
\begin{align}
\label{eq:def-tether-10}
& \el{teth}{0} = \Veim{eim},
\\
\label{eq:def-tether-20}
& \text{\Vel{teth}{top} is the start EIM, and}
\\
\label{eq:def-tether-30}
& \myparbox{
for all \var{x} such that
$\var{top} > \var{x} \ge 0,$
\el{teth}{\Vincr{x}} is a top-down cause of
\Vel{teth}{x}.
}
\end{align}
We sometimes say that
\Veim{eim} ``has'' the tether \var{teth}.
\end{definition}

Recall from standard parsing theory that two derivations
which share the same parse tree are considered equivalent,
in the sense that they derive the same sentence,
in our case \Cw{}.
For our purposes,
we want to know if derivations
from the same parse tree
are equivalent in a stronger
sense.
The following theorem shows that,
for two derivations from the same parse tree,
the sets of EIM validity equivalents are the same.

\begin{theorem}
\ttitle{EIM-derivation equivalence}
\label{t:derivation-eim-equivalence}
Let \Veim{eim} be an EIM,
and let \var{d1} and \var{d2} be two derivations
which share the same parse tree.
\Veim{eim} has a validity equivalent in \var{d1}
if and only if it has a validity equivalent in \var{d2}.
\end{theorem}

\begin{proof}
Because \var{d1} and \var{d2} are symmetric, we need
to show only the ``if'' direction.
We assume that
\Veim{eim} has a validity equivalent in \var{d1},
to show that it also has a validity equivalent in \var{d2}.
Let the EIM be
\begin{multline}
\label{eq:derivation-eim-equivalence-10}
   \Veim{eim} =
   \big[ [ \Vsym{A} \de \Vstr{prefix} \mydot \Vstr{suffix} ], \Vloc{i}, \Vloc{j} \big] \\
\text{where $\Vstr{prefix} = \Vsym{C1} \Vsym{C2} \ldots \Vsym{Cn}$} \\
\text{and $\Vstr{suffix} = \Vsym{D1} \Vsym{D2} \ldots \Vsym{Dn}$}
\end{multline}
so that the validity equivalent of \Veim{eim} is
\begin{equation}
\label{eq:derivation-eim-equivalence-15}
    \Vsym{A} \derives \Vmk{i} \Vstr{prefix} \Vmk{j} \Vstr{suffix}
\end{equation}
Here
\eqref{eq:derivation-eim-equivalence-10} and
\eqref{eq:derivation-eim-equivalence-15}
are without loss of generality.
The corresponding node and direct descendants in the parse tree
will be
\[
\Tree [.A
  \Vsym{C1} \Vsym{C2} \ldots{} \Vsym{Cn}
  \Vsym{D1} \Vsym{D2} \ldots{} \Vsym{Dn}
]
\]
and since symbol instances in the parse tree are those
of \var{d1},
it remains the case that
\begin{equation}
\label{eq:derivation-eim-equivalence-20}
\Vsym{C1} \Vsym{C2} \ldots{} \Vsym{Cn} \destar \Cw[\var{i},(\Vdecr{j})]
\end{equation}

The order of the derivation in \var{d2} may differ from \var{d1}.
But
\eqref{eq:derivation-eim-equivalence-20} from the parse tree will continue
to hold in \var{d2};
and in \var{d2} there is some point at which \Vsym{A}
expands into its direct descendants.
Therefore
\eqref{eq:derivation-eim-equivalence-15}
holds for some derivation step in \var{d2}.
Since
\eqref{eq:derivation-eim-equivalence-15}
is unchanged,
it remains the validity equivalent of
\eqref{eq:derivation-eim-equivalence-10}.
Because \eqref{eq:derivation-eim-equivalence-10}
was chosen without loss of generality,
this shows the theorem.
\end{proof}

\begin{lemma}
\ltitle{EIM tether prediction}
\label{lem:eim-tether-prediction}
Let
$\Veim{prd} = \langle \var{s}, \var{rha1}, \var{rhz1}, 0\rangle$ be a prediction
expressed in terms of \var{d},
a derivation focused within \Veim{prd}.
Then \Veim{prd} has a top-down cause, \Veim{down},
such that,
for some
\var{rha2}, \var{rhz2}, \var{dot2},
we have
\begin{gather}
\label{lem:eim-tether-prediction-5}
\Veim{down} = \langle \Vdecr{s}, \var{rha2}, \var{rhz2}, \var{dot2}\rangle \\
\label{lem:eim-tether-prediction-8}
\text{and \var{d} is focused within \Veim{down}.}
\end{gather}
\end{lemma}

\begin{proof}
Since \Veim{prd} is a prediction, it is not the start EIM,
and therefore its LHS symbol is not \Vsym{accept}.
Without loss of generality, let
\begin{equation}
\label{lem:eim-tether-prediction-15}
\Veim{prd} = \big[ [ \Vsym{prd} \de \mydot \Vstr{prd-rhs} ], \Vloc{j}, \Vloc{j} \big]
\end{equation}
By assumption for the lemma, \var{d} is focused within \Veim{prd},
and it is at derivation step \var{s}.
So,
combining Theorem \ref{t:focusing-props} with
\eqref{lem:eim-tether-prediction-15},
we have
for some \Vloc{i}, \Vstr{pre} and \Vstr{post},
\begin{equation}
\label{lem:eim-tether-prediction-20}
\begin{aligned}
& \Vsym{down} && \text{Step \xxsubtract{\var{s}}{2}} \\
\derives \; & \Vmk{i} \Vstr{pre} \Vmk{j} \Vsym{prd} \Vstr{post} \qquad && \text{Step \Vdecr{s}} \\
\derives \; & \Vmk{i} \Vstr{pre} \Vmk{j} \Vstr{prd-rhs} \Vstr{post} \qquad && \text{Step \var{s}}
\end{aligned}
\end{equation}
and
\begin{equation}
\label{lem:eim-tether-prediction-23}
\text{\var{d} is focused within \Vsym{down}.}
\end{equation}

From
\eqref{lem:eim-tether-prediction-20},
we see that
$[\Vsym{down} \de \Vstr{pre} \Vsym{prd} \Vstr{post}]$ is a rule,
so that
\begin{equation}
\label{lem:eim-tether-prediction-24}
\Vdr{down} = [\Vsym{down} \de \Vstr{pre} \mydot \Vsym{prd} \Vstr{post}]
\end{equation}
is a
dotted rule
and one which is,
by the definition of top-down cause for dotted rules,
a top-down cause of \DR{\Veim{prd}}.
From this observation,
the assumption for this lemma that \Veim{prd} is a prediction,
and
\dref[causes of predicted EIM]{def:causes-predicted},
we see that
\begin{equation}
\label{lem:eim-tether-prediction-25a}
\begin{gathered}
\text{\Veim{down} is a top-down cause of \Veim{prd}} \\
\text{if} \quad \DR{\Veim{down}} = \Vdr{down} \\
\text{and} \quad \Current{\Veim{down}} = \Current{\Veim{prd}}.
\end{gathered}
\end{equation}

From
\eqref{lem:eim-tether-prediction-20}
and the definition of EIM validity,
we see that
\begin{gather}
\label{lem:eim-tether-prediction-26}
\Veim{down} = \big[ [ \Vsym{down} \de \Vstr{pre} \mydot \Vsym{prd} \Vstr{post} ], \Vloc{i}, \Vloc{j} \big]
\\
\text{and} \quad \Valid{\Veim{down}}.
\end{gather}

From
\eqref{lem:eim-tether-prediction-24}
and
\eqref{lem:eim-tether-prediction-26},
we have
\begin{equation}
\label{lem:eim-tether-prediction-26c}
\DR{\Veim{down}} = \Vdr{down}
\end{equation}

From
\eqref{lem:eim-tether-prediction-20}
and
\eqref{lem:eim-tether-prediction-26},
we have
\begin{align}
\label{lem:eim-tether-prediction-27a}
\Current{\Veim{down}} & = \Vloc{j} \\
\label{lem:eim-tether-prediction-27b}
& = \myfnname{Left}\big(\Vsym{prd}@(\Vdecr{s})\big) \\
\label{lem:eim-tether-prediction-27c}
& = \Left{\LHS{\Veim{prd}}} \\
\intertext{and because \Veim{prd} is a prediction}
\label{lem:eim-tether-prediction-27d}
\Current{\Veim{down}} & = \Current{\Veim{prd}}.
\end{align}

From
\eqref{lem:eim-tether-prediction-25a},
\eqref{lem:eim-tether-prediction-26c}
and
\eqref{lem:eim-tether-prediction-27d},
we can conclude that
\begin{equation}
\label{lem:eim-tether-prediction-30}
\text{\Veim{down} is a top-down cause of \Veim{prd}.}
\end{equation}

In 4-tuple representation, \Veim{down} is
for some \var{tbd},
\var{rha2}, \var{rhz2}, \var{dot2},
\begin{equation}
\label{lem:eim-tether-prediction-29}
\Veim{down} = \langle \var{tbd}, \var{rha2}, \var{rhz2}, \var{dot2}\rangle.
\end{equation}
We see from
\eqref{lem:eim-tether-prediction-20} that the LHS instance of \Veim{down}
is at Step \xxsubtract{\var{s}}{2},
and its RHS instance is at Step \Vdecr{s}.
The EIM has the same derivation step as its RHS instance,
so that
\eqref{lem:eim-tether-prediction-29}
becomes
\begin{equation}
\label{lem:eim-tether-prediction-33}
\Veim{down} = \langle \Vdecr{s}, \var{rha2}, \var{rhz2}, \var{dot2}\rangle.
\end{equation}
\eqref{lem:eim-tether-prediction-30}
and
\eqref{lem:eim-tether-prediction-33}
show
\eqref{lem:eim-tether-prediction-5}
in the statement of the lemma.

It remains to show
\eqref{lem:eim-tether-prediction-8}
in the statement of the lemma.
From
\eqref{lem:eim-tether-prediction-23},
we know that
\var{d} is focused in \LHS{\Veim{down}}.
By the definition of derivations focused within an EIM,
we have
\eqref{lem:eim-tether-prediction-8}
and the lemma.
\end{proof}

\begin{lemma}
\ltitle{EIM tether confirmation}
\label{lem:eim-tether-confirmation}
Let
\begin{equation}
\label{lem:eim-tether-confirmation-2}
\Veim{firm} = \langle \var{s}, \var{rha}, \var{rhz}, \var{dx}\rangle
\end{equation}
be a confirmed
EIM
expressed in terms of \var{d},
a derivation focused within \Veim{firm}.
Then \Veim{firm} has a top-down cause,
\begin{gather}
\label{lem:eim-tether-confirmation-5}
\Veim{down} = \langle \var{s}, \var{rha}, \var{rhz}, \Vdecr{dx}\rangle \\
\label{lem:eim-tether-confirmation-8}
\text{and \var{d} is focused within \Veim{down}.}
\end{gather}
\end{lemma}

\begin{proof}
Without loss of generality,
we write
\eqref{lem:eim-tether-confirmation-2}
in 3-tuple form as
\begin{equation}
\label{lem:eim-tether-confirmation-15}
\Veim{firm} = [ [ \Vsym{A} \de \Vstr{before} \cat \Vsym{up} \mydot \Vstr{after} ], \var{i}, \var{k} ],
\end{equation}
its predot symbol instance as
\begin{equation}
\label{lem:eim-tether-confirmation-18}
\Vmkl{j} \Vsym{up} \Vmkr{k}
\end{equation}
and
\Veim{down} as
\begin{equation}
\label{lem:eim-tether-confirmation-21}
\Veim{down} = [ [ \Vsym{A} \de \Vstr{before} \mydot \Vsym{up} \cat \Vstr{after} ], \var{i}, \var{j} ]
\end{equation}
where
by
Definition \ref{def:4-tuple-eim},
the definition of the 4-tuple notation for EIM's,
we have
\begin{gather}
\label{lem:eim-tether-confirmation-22}
\Vsym{A} = \Symbol{\drv{d}{\Vdecr{s}}{\var{rha}}} \\
\notag
\Vstr{before} = \Symbol{\drv{d}{\var{s}}{\, \var{rha} \; \ldots \; (\var{rha}+\Vdecr{dx}) \, }} \\
\notag
\Vsym{up} = \Symbol{\drv{d}{\var{s}}{\var{rha}+\var{dx}}} \quad \text{and} \\
\notag
\Vstr{after} = \Symbol{\drv{d}{\var{s}}{\, (\var{rha}+\var{dx}+1) \; \ldots \; \var{rhz} \, }}
\end{gather}
\eqref{lem:eim-tether-confirmation-21} is a top-down cause
of \Veim{firm}
\dref[causes of confirmed EIM]{def:causes-confirmed}.

Let our first draft of \Veim{down} take the fully general form
\begin{equation}
\label{lem:eim-tether-confirmation-27}
\Veim{down} = \langle \var{s2}, \var{rha2}, \var{rhz2}, \var{dx2}\rangle.
\end{equation}
The symbol instances of the RHS for \Veim{down} are exactly those
of \Veim{firm}:
$\var{rha} = \var{rha2}$,
and
$\var{rhz} = \var{rhz2}$.
Since the symbol instances of the RHS are the same as those of \Veim{firm},
\Veim{down}'s RHS derivation step is also the same,
and therefore its EIM step is the same:
$\var{s} = \var{s2}$.
Finally, it is clear from comparison of
\eqref{lem:eim-tether-confirmation-15}
with
\eqref{lem:eim-tether-confirmation-21},
that
$\var{dx2} = \Vdecr{dx}$.
Collecting these results and substituting them in
\eqref{lem:eim-tether-confirmation-27},
we have
\begin{equation}
\label{lem:eim-tether-confirmation-35}
\Veim{down} = \langle \var{s}, \var{rha}, \var{rhz}, \Vdecr{dx}\rangle,
\end{equation}
which shows
\eqref{lem:eim-tether-confirmation-5}
in the statement of the lemma.

It remains to show
\eqref{lem:eim-tether-confirmation-8}
in the statement of the lemma.
If \var{d} is focused within \Veim{firm} then it is,
by the definition of a focused derivation for EIM's,
focused within its LHS symbol instance.
From
\eqref{lem:eim-tether-confirmation-2},
we see that
the LHS symbol instance of \Veim{firm}
is \drv{d}{\Vdecr{s}}{\var{rha}}.
From
\eqref{lem:eim-tether-confirmation-22} we see that
the LHS symbol instance of \Veim{down} is also
\drv{d}{\Vdecr{s}}{\var{rha}}.
So \var{d} is focused within the LHS symbol instance of
\Veim{down},
and therefore
\var{d} is focused within \Veim{down}.
This shows
\eqref{lem:eim-tether-confirmation-8}.
\end{proof}

\begin{theorem}
\label{t:deriv-tether}
\ttitle{EIM tether}
Let
\begin{equation}
\label{t:deriv-tether-3}
\Veim{eim} = \big[ [ \Vsym{A} \derives \Vstr{predot} \mydot \Vstr{postdot} ],
\Vorig{i}, \Vloc{j} \big]
\end{equation}
Then
\begin{equation}
\label{t:deriv-tether-5}
\Vsym{A} \derives [\var{i}]\, \Vstr{predot} \,[\var{j}]\, \Vstr{postdot}
\end{equation}
if and only if
\begin{equation}
\label{t:deriv-tether-8}
\text{\Veim{eim} has a tether.}
\end{equation}
\end{theorem}

\begin{proof}
\textbf{The ``if'' direction}:
The ``if'' direction is easy to show.
We assume
\eqref{t:deriv-tether-8}
to show
\eqref{t:deriv-tether-5}.
If \Veim{eim} has a tether,
call it \var{teth},
then,
by the definition of a tether,
\Veim{eim} is \el{teth}{0}.
All elements of \var{teth} are valid
by
the assumption of
\eqref{t:deriv-tether-8}.
\eqref{t:deriv-tether-5}
follows from
\eqref{t:deriv-tether-3}
by EIM validity.
This shows the ``if'' direction.

\textbf{The ``only if'' direction}:
For the ``only if'' direction,
we will
assume
\eqref{t:deriv-tether-5}
to show
\eqref{t:deriv-tether-8}.
To do this, we will first construct a
\var{teth} which has \Veim{eim}
as its base,
and then we will show that \var{teth}
satisfies Requirements~\eqref{eq:def-tether-10},
\eqref{eq:def-tether-20}
and
\eqref{eq:def-tether-30}
in Definition \ref{def:tether} (``tether'').

From
\eqref{t:deriv-tether-5}
and the definition of EIM validity,
we know that
\eqref{t:deriv-tether-3}
is valid.
We assume the derivation
\eqref{t:deriv-tether-5},
call it \var{d},
to be focused within \Veim{eim}.
We can do this without loss of generality,
because by Theorem
\ref{t:derivation-eim-equivalence},
every derivation has a
derivation focused at \Vloc{i} which validates
the same set of EIM's.

We construct \var{teth} using
the following algorithm:
\begin{algorithm}[tb]
\algtitle{Construct tether}{alg:construct-tether}
\begin{algorithmic}[1]
\Procedure{Construct tether}{}
\State $\el{teth}{0} \gets \Veim{eim}$
\label{line:eim-tether-10}
\State $\var{ix} \gets 0$
\While{ \Vel{teth}{ix} is not the start EIM }
\label{line:eim-tether-20}
\If{\Vel{teth}{ix} is a confirmed EIM}
\State Find \Veim{td}, top-down cause of \Vel{teth}{ix} \ldots
\State \ldots{} using Lemma \ref{lem:eim-tether-confirmation}
\Else
\State If here, \Vel{teth}{ix} is a prediction
\State Find \Veim{td}, top-down cause of \Vel{teth}{ix} \ldots
\State \ldots{} using Lemma \ref{lem:eim-tether-prediction}
\EndIf
\State $\el{teth}{\Vincr{ix}} \gets \Veim{td}$
\State $\var{ix} \gets \Vincr{ix}$
\EndWhile
\label{line:eim-tether-90}
\EndProcedure
\end{algorithmic}
\end{algorithm}

\textbf{``Only if'', first requirement}:
We have
\eqref{eq:def-tether-10},
trivially from
Line \ref{line:eim-tether-10}
of the above algorithm.

\textbf{``Only if'', second requirement}:
We show
\eqref{eq:def-tether-30}
by induction, where the induction hypothesis
is
\begin{gather}
\label{t:deriv-tether-20}
\text{\var{d} is focused within \Vel{teth}{x}} \\
\label{t:deriv-tether-22}
\text{and} \quad
\left(
\begin{gathered}
\var{x} = 0 \\
\text{or \Vel{teth}{x} is a top-down cause} \\
\text{of \Vel{teth}{\Vdecr{x}}}.
\end{gathered}
\right)
\end{gather}

We assumed that \var{d} is focused within
$\el{teth}{0} = \Veim{eim}$,
and we have
\eqref{t:deriv-tether-22} for $\var{x} = 0$
trivially.
We use this as the basis of the induction.

For the step of the induction we assume
\begin{equation}
\tag{STEP}
\label{t:deriv-tether-30}
\text{\eqref{t:deriv-tether-20} and \eqref{t:deriv-tether-22}
for $\var{x} = \var{i}$.}
\end{equation}
and we seek to show
\begin{equation}
\tag{GOAL}
\label{t:deriv-tether-35}
\text{
\eqref{t:deriv-tether-20} and \eqref{t:deriv-tether-22}
for $\var{x} = \Vincr{i}$.
}
\end{equation}
When \Vel{teth}{i} is a confirmed EIM,
\eqref{t:deriv-tether-35} follows from
\eqref{t:deriv-tether-30}
and Lemma \ref{lem:eim-tether-confirmation}.
When \Vel{teth}{i} is a predicted EIM,
\eqref{t:deriv-tether-35} follows from
\eqref{t:deriv-tether-30}
and Lemma \ref{lem:eim-tether-prediction}.
This shows the step of the induction,
the induction,
and
\eqref{eq:def-tether-30}.

\textbf{``Only if'', third requirement}:
It remains to show
\eqref{eq:def-tether-20}.
From Line
\ref{line:eim-tether-20}
of the algorithm, we see that we stop
only when and if we find a start EIM.
So if we stop,
and \var{top} is the last index of \var{teth},
then \Vel{teth}{top} is the start EIM.
But do we ever stop?

We will count the number of EIM's in the tether.
They fall into three categories:
the start EIM,
predicted EIM's,
and confirmed EIM's,
whose count we will write as,
respectively \var{s-cnt},
\var{p-cnt},
and
\var{c-cnt}.
It will be most convenient to count EIM's,
not as they are added,
but as they are processed in a pass of the
loop from Lines
\ref{line:eim-tether-20}--\ref{line:eim-tether-90}
of our ``Construct tether'' algorithm.
From
Line \ref{line:eim-tether-20},
we see that
only one start EIM
is ever processed:
\begin{equation}
\label{t:deriv-tether-40}
\var{s-cnt} = 1.
\end{equation}
We note from
Lemma \ref{lem:eim-tether-prediction},
that every time we process a prediction in \var{teth},
the derivation step is decremented in the next tether element,
and examination of
Lemma \ref{lem:eim-tether-confirmation}
shows that the derivation step is never incremented.
Recall that the length of every derivation is
a finite constant ---
even a derivation of the form $\Vstr{A} \destar \Vstr{B}$
signifies that there exists some finite \var{k}
such that $\Vstr{A} \xderives{\var{k}} \Vstr{B}$.
So we know that
$\var{p-cnt} = \var{k}$ for some finite \var{k},
and therefore
\begin{equation}
\label{t:deriv-tether-43}
\var{p-cnt} = \Oc.
\end{equation}

Finally, we examine the confirmations.
Call the maximum length of a RHS, \var{maxrh}.
\var{maxrh} is a constant which depends on \Cg.
We see from
Lemma \ref{lem:eim-tether-confirmation}
that the dot index is decremented every
time a confirmation is processed.
But Lemma \ref{lem:eim-tether-prediction}
resets the dot index
every time a prediction is processed,
possibly to as high as
\var{maxrh}.
So the number of confirmations may be as great as
\begin{equation}
\label{t:deriv-tether-46}
\var{c-cnt} = \var{maxrh} \times \var{p-cnt}.
\end{equation}
\var{maxrh} is a constant,
so that, using \eqref{t:deriv-tether-43},
\eqref{t:deriv-tether-46}
becomes
\begin{equation}
\label{t:deriv-tether-49}
\var{c-cnt} = \Oc.
\end{equation}
Combining
\eqref{t:deriv-tether-40},
\eqref{t:deriv-tether-43}
and
\eqref{t:deriv-tether-49},
we see that the total number of tether EIM's is
\begin{equation}
\var{s-cnt} + \var{p-cnt} + \var{c-cnt} =
1 + \Oc + \Oc = \Oc.
\end{equation}

We have shown that the construction of the tether does,
indeed, stop.
With this we have shown
\eqref{eq:def-tether-20}
and the theorem.
\end{proof}

\begin{theorem}
\label{t:eim-tether}
\ttitle{EIM tether}
If \Veim{eim} is valid,
it has a tether.
\end{theorem}

\begin{proof}
Without loss of generality, let
\begin{equation}
\label{t:eim-tether-3}
\Veim{eim} = \big[ [ \Vsym{A} \derives \Vstr{predot} \mydot \Vstr{postdot} ],
\Vorig{i}, \Vloc{j} \big]
\end{equation}
Since, by assumption for the theorem, \Veim{eim} is valid,
we have
\begin{equation}
\label{t:eim-tether-5}
\Vsym{A} \derives [\var{i}]\, \Vstr{predot} \,[\var{j}]\, \Vstr{postdot}
\end{equation}
This theorem follows from
\eqref{t:eim-tether-5} and
Theorem \ref{t:deriv-tether}.
\end{proof}

If \var{hi} and \var{lo} are
tether indexes such that $\var{hi} > \var{lo}$,
we say that \Vel{teth}{lo} is
\xdfn{below}{below!in a tether}
\Vel{teth}{hi};
and that the direction from
\Vel{teth}{hi} to
\Vel{teth}{lo} is
\xdfn{downward}{downward!in a tether}.

\begin{theorem}
\ttitle{Tether non-decreasing location}
\label{t:non-decreasing-location}
If we follow a tether downward,
the right locations of its elements are non-decreasing:
\begin{equation}
\var{lo} < \var{hi}
\implies \Right{\Vel{teth}{lo}} \ge \Right{\Vel{teth}{hi}}
\end{equation}
\end{theorem}

\begin{proof}
By examining
the cases of Theorem
\ref{t:right-location-of-top-down-cause},
we see
that the right location of an effect
is never less than the right location of its
top-down cause.
\end{proof}

\begin{theorem}
\ttitle{Location 0 Earley items}
\label{t:location-0-eims}
An EIM is valid at location 0 if and only if it
is in the ethereal closure of the start EIM.
\end{theorem}

\begin{proof}
Let \var{ecs} be the ethereal closure of the
start EIM.
We first show
the ``if'' direction.
We assume that an EIM is in \var{ecs} to show that
it is at location 0.
The start EIM is by definition at location 0.
Any other EIM in \var{ecs} is produced by iterating
\var{epsilon-op}.
As can be seen from
Theorem
\ref{t:right-location-of-top-down-cause},
an \var{epsilon-op} does not increment the right location
of its argument.
Therefore every EIM in the ethereal closure of the start
EIM will be at location 0.

It remains to
show the ``only if'' direction.
We assume that an EIM, call it \Veim{eim},
is at location 0.
We seek
to show that \Veim{eim} is in \var{ecs}.
By Theorem \ref{t:eim-tether},
every EIM has a tether,
so every EIM at location 0 has a tether.
By Theorem
\ref{t:non-decreasing-location}
locations in a tether are non-decreasing
so that every element of the tether of \Veim{eim}
must be at location zero.
We note from
Theorem
\ref{t:right-location-of-top-down-cause},
that the reduction and read EIM's have a location
greater than that of their top-down cause,
and therefore other than 0.
So the tether of \Veim{eim} can contain only null-scans,
predictions, and the start EIM.
By its definition, the tether starts with its top
element, the start EIM.
Therefore \Veim{eim} is the result of the iteration
of epsilon operations,
beginning with the start EIM.
By the definition of ethereal closure, any EIM
that is the result of iterating epsilon operations
on a telluric base is
in the ethereal closure of that telluric base.
So \Veim{eim} is in the ethereal closure of the
start EIM, or \var{ecs}.
\end{proof}

\begin{theorem}
\ttitle{Earley item has telluric base at same location}
\label{t:eim-has-telluric-base}
Let \Veim{desc} be a valid EIM at location
\Vloc{i}.
Then \Veim{desc} has a telluric base,
\Veim{base}, such that
$\Current{\Veim{base}} = \Vloc{i}$.
\end{theorem}

\begin{proof}
We consider first, as a special case,
location 0.
By Theorem \ref{t:location-0-eims},
all EIM's at location 0
are in the ethereal closure of the start EIM,
call it \var{ecs}.
The telluric base of \var{ecs} is the start
EIM, and it is at location 0.

We now consider the case
of locations greater than 0.
By Theorem \ref{t:eim-tether},
\Veim{desc} has a tether,
call it \var{teth}.
By definition of the tether, its top element has right
location 0.
By assumption for this case,
\Veim{desc} has a right location greater than 0.
Let \Current{\Veim{desc}} be \Vloc{i}.
If we descend
\var{teth} from its top element,
we will encounter a first element of \var{teth} at \Vloc{i}.
Call this first element, $\Veim{base} = \Vel{teth}{base-ix}$.

\Veim{base} will not be the top element
because the top element is at location 0,
which by assumption for the case is not location \Vloc{i}.
Therefore there will be a tether element above it,
\el{teth}{\Vincr{base-ix}}.
Call
\el{teth}{\Vincr{base-ix}}, \Veim{prev}.
\Veim{prev} will not be at \Vloc{i}, otherwise it would
have been the first tether element encountered at \Vloc{i}.
So we have
\begin{equation}
\label{eq:eim-has-telluric-base-20}
\Right{\Veim{prev}} \neq \Right{\Veim{base}}.
\end{equation}
From
\eqref{eq:eim-has-telluric-base-20},
and Theorem
\ref{t:right-location-of-top-down-cause},
we know that \Veim{base} is not a null-scan
or a prediction.
Therefore
\begin{equation}
\label{eq:eim-has-telluric-base-25}
\text{\Veim{base} is a telluric EIM.}
\end{equation}

We choose
\Veim{base} in such a way that
\[
  \Right{\Veim{base}} = \Right{\Veim{desc}},
\]
and \Veim{base} is on \var{teth} above \Veim{desc}.
So there is a series of zero or more top-down causes
from \Veim{base} to \Veim{desc}.
Let the tether index of \Veim{desc} be \var{desc-ix}.
Since right location is non-decreasing,
every EIM with an index \var{ix}
such that
\[
\var{base-ix} > \var{ix} \ge \var{desc-ix}
\]
must not increase the right location
from that of its top-down cause.
Therefore,
\begin{equation}
\label{eq:eim-has-telluric-base-35}
\Current{\Veim{base}} = \Current{\Veim{desc}}.
\end{equation}
Together,
\eqref{eq:eim-has-telluric-base-25}
and
\eqref{eq:eim-has-telluric-base-35}
show the theorem.
\end{proof}

\chapter{Earley tables}
\label{ch:earley-tables}

In the context of a specific \Cg{},
a specific \Cw{},
and a specific Earley implementation,
an Earley parser builds a table of Earley sets,
\Ctables.
Let \alg{Impl} be an Earley implementation.
In contexts where it is not clear
which implementation is being referred to,
we say \Vtables{Impl}
when we are referring to the tables of \alg{Impl}.
For example, the tables for Marpa
are \Vtables{Marpa}.

Traditionally, the tables of an Earley algorithm
are grouped into sets,
one \dfn{Earley set} for each location of \Cw{}:
\begin{equation*}
\EVtable{\alg{Impl}}{i},
\quad \text{where} \quad
0 \le \Vloc{i} \le \size{\Cw}.
\end{equation*}
Earley sets are of type \dtype{ES}.
Earley sets are often named by their location,
so that \Ves{i} means the Earley set at \Vloc{i}.
The type designator \type{ES} is often omitted to avoid clutter,
especially in cases where the Earley set is not
named by location.

\EVtable{\alg{Impl}}{i} will be
the Earley set at \Vloc{i}
in the table of Earley sets of
the \alg{Impl} implementation.
For example,
\EVtable{\Marpa}{j} will be Earley set \Vloc{j}
in \Marpa's table of Earley sets.
In contexts where it is clear which recognizer is
intended,
\Vtable{k}, or \Ves{k}, will symbolize Earley set \Vloc{k}
in that recognizer's table of Earley sets.
If \Ees{\var{working}} is an Earley set,
$\size{\Ees{\var{working}}}$%
\index{recce-notation}{\Pipe{}es\Pipe{}@\Vsize{es} (size of an Earley set)}
is the number of Earley items
in \Ees{\var{working}}.

\Rtablesize{\alg{Recce}} is the total number
of Earley items in all Earley sets for \alg{Recce},
\begin{equation*}
\Rtablesize{\alg{Recce}} =
     \sum\limits_{\Vloc{i}=0}^{\size{\Cw}}
  {\bigsize{\EVtable{\alg{Recce}}{i}}}.
\end{equation*}
For example,
\Rtablesize{\Marpa} is the total number
of Earley items in all the Earley sets of
a \Marpa{} parse.

An Earley item may be memoized.
An Earley item is \dfn{memoized}
if and only if it is
not kept in an Earley set,
but is kept in a form from which it can be recovered.
Chapter \ref{ch:leo}
will show one way in which Earley items
can be memoized.
To say that \Veim{x} is memoized,
we also say \Memoized{\Veim{x}}.%
\index{recce-notation}{Memoized(x)@\Memoized{\var{eim}}}

A set of EIM's (not necessarily an Earley set)
is \dfn{consistent} if and only if all of its
EIM's are valid and unmemoized.
For example,
the Earley set \Ves{i}
is \dfn{consistent} if and only if
every EIM in the Earley set at \Vloc{i}
is valid and unmemoized:
\begin{equation}
\label{eq:def-complete-1}
\Veim{eim} \in \Ves{i} \implies \Valid{\Veim{eim}} \land \neg \Memoized{\var{eim}}
\end{equation}

Let \Veimset{x} be a set of EIM's.
\Veimset{x} is not necessarily an Earley set.
We say that
\Veimset{x} is \dfn{complete} for a predicate \var{phi},
if and only if,
for all \Veim{eim},
\begin{equation}
\label{eq:def-complete-2}
\begin{split}
& \Valid{\Veim{eim}} \land \neg \Memoized{\var{eim}} \land \var{phi}(\var{eim}) \\
& \qquad \qquad \implies \Veim{eim} \in \Veimset{x}.
\end{split}
\end{equation}
If we say that an EIM set, \Veimset{x},
is \dfn{self-complete},
then \var{phi} is membership in \Veimset{x}:
\[ \lambda \Veim{eim} . \var{eim} \in \Veimset{x}, \]
so that
\eqref{eq:def-complete-2} simplifies to
\begin{equation}
\label{eq:def-complete-4}
\begin{split}
& \Valid{\Veim{eim}} \land \neg \Memoized{\var{eim}} \\
& \qquad \qquad \implies \Veim{eim} \in \Veimset{x}.
\end{split}
\end{equation}

For example,
the EIM set \Veimset{x} is complete
for the predicate
\begin{equation}
\label{eq:def-complete-6}
\lambda \var{eim} . \Current{\Veim{eim}} = \Vloc{i}
\end{equation}
if and only if,
for all \Veim{eim},
\begin{equation*}
\begin{split}
& \Valid{\Veim{eim}} \land \neg \Memoized{\var{eim}} \land \Current{\var{eim}} = \Vloc{i} \\
& \qquad \qquad \implies \Veim{eim} \in \Veimset{x}.
\end{split}
\end{equation*}
If $\Veimset{x} = \Ves{i}$, then
saying that \Ves{i} is complete for
\eqref{eq:def-complete-6}
is the same as saying that
\Ves{i} is self-complete.

We say that
\Veimset{x} is \dfn{correct} for a predicate \var{phi},
if and only if it is consistent
and complete for a predicate \var{phi}.
We say that
\Veimset{x} is \dfn{self-correct},
if and only if it is consistent
and self-complete.

We often say that an EIM set is complete or correct,
in a context where no predicate is specified.
In that case,
we mean that the EIM set is self-complete or self-correct.

We call
\begin{equation}
\Veim{accept} = [\Vdr{accept}, 0, \Vsize{\Cw}]
\end{equation}
the \dfn{accept EIM}.
Let \alg{Impl} be an Earley implementation.
We say that \alg{Impl}
\dfn{accepts} an input
if and only if \Veim{accept} is in its Earley tables:
\begin{equation}
\label{eq:def-implementation-accepts-10}
\myL{\alg{Impl},\Cg}
\defined
\Veim{accept} \in \Vtables{Impl}
\end{equation}
We say that an Earley implementation is \dfn{correct} if and only
if the set of strings it accepts is exactly the set of
strings in the language of its grammar.

\begin{theorem}\label{t:algorithm-correct}
\ttitle{Earley implementation correctness}
If, for a given Earley implementation,
\begin{equation}
\label{eq:algorithm-correct-1}
\text{\Ves{\Vsize{\Cw}} is correct,}
\end{equation}
then
that implementation accepts all and only the
correct inputs:
\begin{equation}
\label{eq:algorithm-correct-2}
[\Vdr{accept}, 0] \in \bigEtable{\Vsize{\Cw}} \; \equiv \; \Cw \in \var{L}(\Cg).
\end{equation}
\end{theorem}

\begin{proof}
We prove the forward direction of the equivalence first.
We assume that
\begin{equation}
\label{eq:algorithm-correct-3}
[\Vdr{accept}, 0] \in \bigEtable{\Vsize{\Cw}}.
\end{equation}
By \eqref{eq:algorithm-correct-1},
\Ves{\Vsize{\Cw}} is correct.
Therefore,
by \eqref{eq:algorithm-correct-3},
the definition of validity for an Earley item,
and the definition of the accept rule \eqref{eq:accept-rule-def-10},
\begin{equation}
\label{eq:algorithm-correct-6}
\begin{split}
& \Vsym{accept} \destar \mk{0} \Vsym{start} \mk{\Vsize{\Cw}}
\end{split}
\end{equation}
By the definition of the location markers,
\eqref{eq:algorithm-correct-6}
means that
\begin{equation}
\label{eq:algorithm-correct-15}
\Vsym{accept} \destar \var{w}[\var{0}, \Vsize{\Cw} \subtract 1] \destar \Cw.
\end{equation}
From
\eqref{eq:algorithm-correct-15},
by the definition of \Cw{},
we have that
\begin{equation}
\label{eq:algorithm-correct-27}
\Cw \in \var{L}(\Cg).
\end{equation}
This shows the forward direction of the equivalence.

To show the reverse direction of the equivalence, we assume
\eqref{eq:algorithm-correct-27}.
From it,
the definition of the \Vsym{accept} symbol,
and the definition of $\var{L}(\Cg)$,
we have
\eqref{eq:algorithm-correct-15}.
By the definition of the \Vsym{accept} symbol,
it is only on the LHS of the accept rule,
so that we have
\begin{equation}
\label{eq:algorithm-correct-40}
\Vsym{accept} \derives [0]\, \Vsym{start} \,[\Vsize{\Cw}] \destar \Cw.
\end{equation}
By assumption for the theorem, the Earley set at
\Vsize{\Cw} is correct and therefore complete.
If the Earley set at \Vsize{\Cw} is complete,
by \eqref{eq:algorithm-correct-40}
and the definition of validity for Earley items,
we have
\begin{equation}
\label{eq:algorithm-correct-46}
[\Vdr{accept}, 0] \in \bigEtable{\Vsize{\Cw}}.
\end{equation}
This shows the reverse direction of the equivalence.
We have now shown both directions of the equivalence,
and therefore the theorem.
\end{proof}

\begin{theorem}
\ttitle{Earley set size}
\label{t:es-count}
The size of the Earley set at \Vloc{i} is,
worst case, $\order{\var{i}}$:
\begin{equation*}
\textup{
    $\bigsize{\EVtable{\Marpa}{i}} = \order{\var{i}}$.
}
\end{equation*}
\end{theorem}

\begin{proof}
EIM's have the form $[\Vdr{x}, \Vorig{x}]$.
\Vorig{x} is the origin of the EIM,
which in Marpa cannot be after the current
Earley set  at \Vloc{i},
so that
\begin{equation*}
0 \le \Vorig{x} \le \Vloc{i}.
\end{equation*}
The number of possible values for \Vdr{x}
is the count of dotted rules in \Cg{}.
Call that count, $\size{\Cdr}$.
$\size{\Cdr}$
is a finite constant that depends on the grammar,
\Cg{}.
Since duplicate EIM's are never added to an Earley set,
the maximum size of Earley set \Vloc{i} is therefore
\begin{equation*}
(\Vloc{i} + 1) \times \size{\Cdr} = \order{\Vloc{i}}.\qedhere
\end{equation*}
\end{proof}

\chapter{Silos}
\label{ch:silos}

\begin{definition}
\dtitle{Silo}
\label{def:silo}
A dotted rule is
\xdfn{silo-eligible}{silo-eligible (dotted rule)}
if and only if it is quasi-complete.
An Earley item
is
\xdfn{silo-eligible}{silo-eligible (EIM)}
if and only
if its dotted rule is silo-eligible.
We say that an EIM, call it \Veim{cuz},
is the \dfn{silo cause} of another EIM,
call it \Veim{effect},
if and only if
\begin{itemize}
\item
\Veim{cuz} and \Veim{effect}
are silo-eligible,
\item
$\Right{\Veim{cuz}} = \Right{\Veim{effect}}$,
and
\item
\Veim{cuz} is a top-down or bottom-up cause
of \Veim{effect}.
\end{itemize}
If \Veim{cuz} is the
\dfn{silo cause}
of \Veim{effect},
we say that \Veim{effect} is the
\dfn{silo effect}
of \Veim{cuz}.

A \dfn{silo},
call it \var{s1},
is a sequence of EIM's,
where
\Vel{s1}{\var{i}} is the silo cause of
\el{s1}{\Vincr{i}}.
\end{definition}

We write \Vop{Silo}{slo} to indicate that \var{slo}
is a silo.%
\index{recce-notation}{Silo(slo)@\Vop{Silo}{slo}}
This definition implies that any subsequence of a silo
is also a silo:
\[
    \Vop{Silo}{sl1} \; \land \; \var{sl2} \subseteq \var{sl1}
  \implies \Vop{Silo}{sl2}
\]
Also, if any two overlapping silos are merged,
the result will be a silo.

We call an element of a silo,
a
\xdfn{layer}{layer (EIM)!wrt a silo}.
We write \Vsize{\var{s1}}%
\index{recce-notation}{\Pipe{}silo\Pipe{}@\Vsize{silo} (size of a silo)}
for the number
of elements in silo \var{s1}.
Our indexing convention is to use
consecutive non-negative integers for silo layers,
starting at zero.
\el{s1}{0}
is called the
\xdfn{bottom}{bottom (EIM)!wrt a silo}
of \var{s1},
and
$\var{s1}\big[ \, \Vlastix{s1} \, \big]$
is the
\xdfn{top}{top (EIM)!wrt a silo}
of \var{s1}.

\begin{theorem}
\ttitle{Silo location uniqueness}
\label{t:silo-location}
Let \Vel{silo}{i}
and
\Vel{silo}{j}
be two layers of a silo.
Then
\begin{equation}
\label{eq:silo-location-4}
\Right{\Vel{silo}{i}} =
\Right{\Vel{silo}{j}}.
\end{equation}
\end{theorem}

\begin{proof}
We first will show that
\begin{equation}
\label{eq:silo-location-7}
\begin{gathered}
\forall \var{x} :
0 \le \var{x}
\le \Vlastix{silo} \\
\implies
\Right{\Vel{silo}{0}} =
\Right{\Vel{silo}{x}}.
\end{gathered}
\end{equation}
The proof
of \eqref{eq:silo-location-7}
is by induction.
We take as the induction hypothesis,
\begin{equation}
\tag{IND}
\label{eq:silo-location-10}
\Right{\el{silo}{0}} =
\Right{\Vel{silo}{x}}
\end{equation}
We have
\eqref{eq:silo-location-10}
trivially if $\var{x} = 0$,
and we use this as the basis of
the induction.

For the step, we assume
\eqref{eq:silo-location-10}
for $\var{x} = \var{i}$
to show
\eqref{eq:silo-location-10}
for $\var{x} = \Vincr{i}$.
We know that
\Vel{silo}{i}
is the silo cause of
\Vel{silo}{\Vincr{i}}.
By the definition of a silo cause,
then
\begin{equation}
\label{eq:silo-location-13}
\Right{\Vel{silo}{i}} =
\Right{\el{silo}{\Vincr{i}}}
\end{equation}
The assumption for the step is that
\begin{equation}
\label{eq:silo-location-16}
\Right{\el{silo}{0}} =
\Right{\el{silo}{\var{i}}}
\end{equation}
and from
\eqref{eq:silo-location-13}
and \eqref{eq:silo-location-16}
we have
\begin{equation}
\label{eq:silo-location-17}
\Right{\el{silo}{0}} =
\Right{\el{silo}{\Vincr{i}}},
\end{equation}
which shows the step, the induction and
\eqref{eq:silo-location-7}.

It remains to show
\eqref{eq:silo-location-4}.
\begin{align}
\label{eq:silo-location-19}
&
\Right{\el{silo}{0}} =
\Right{\Vel{silo}{i}}
&& \eqref{eq:silo-location-7}
\\
\label{eq:silo-location-22}
&
\Right{\el{silo}{0}} =
\Right{\Vel{silo}{j}}
&& \eqref{eq:silo-location-7}
\\
\label{eq:silo-location-25}
&
\Right{\Vel{silo}{i}} =
\Right{\Vel{silo}{j}}
&& \eqref{eq:silo-location-19},
\eqref{eq:silo-location-22}
\end{align}
\eqref{eq:silo-location-25} is
\eqref{eq:silo-location-4},
which shows the theorem.
\end{proof}

We say that \Right{\Vel{sil}{0}}
is the
\xdfn{location}{location!wrt a silo}
of the silo \var{sil}.
From Theorem
\ref{t:silo-location}
we know that the location of the silo will
be the right location of each of its layers.
We also write the
location of silo \var{sil}
as \Right{\var{sil}}.%
\index{recce-notation}{Right(silo)@\Right{\var{silo}}}

\begin{theorem}
\label{t:silo-causes}
\ttitle{Silo causes}
Every silo layer
\begin{itemize}
\item
is a read EIM,
and has no bottom-up or
top-down causes;
\item
is a null-scan EIM and
has at least one top-down silo cause
and no bottom-up silo causes; or
\item
is a reduction EIM and
has at least one bottom-up silo cause
and no top-down silo causes.
\end{itemize}
\end{theorem}

\begin{proof}
\textbf{Read EIM}:
Let \Veim{rd} be a quasi-complete read EIM.
By the definition of causes,
we know that
the bottom-up cause of \Veim{rd} has
no EIM equivalent and therefore is not
a silo cause.
Let \Veim{down} be the top-down cause of a
read EIM.
From Theorem
\ref{t:down-cause-from-effect},
we know that
\begin{align}
\notag
& \Right{\Veim{down}} = \decr{\Right{\Veim{rd}}} \\
\label{eq:silo-causes-20}
\therefore \;\; & \Right{\Veim{down}} \neq \Right{\Veim{rd}}.
\end{align}
\eqref{eq:silo-causes-20} shows that \Veim{down}
cannot be a silo cause of \Veim{rd}.

\textbf{Null-scan EIM}:
Let \Veim{ns} be a quasi-complete null-scan EIM.
By the definition of causes,
we know that
the bottom-up cause of \Veim{ns} has
no EIM equivalent and therefore is not
a silo cause.
Let \Veim{down} be the top-down cause of
\Veim{ns}.
From Theorem
\ref{t:down-cause-from-effect},
we know that
\begin{equation}
\label{eq:silo-causes-30}
\myparbox{$\Right{\Veim{down}} = \Right{\Veim{ns}}.$}
\end{equation}
The only symbol between the dot index of \Veim{down}
and the dot index of \Veim{ns} is,
by the definition of a null-scan EIM,
a nulling symbol,
so that if the dot suffix of \Veim{ns} contains
only nulling symbols,
the dot suffix of \Veim{down} must also contain
only nulling symbols.
Therefore
\begin{equation}
\label{eq:silo-causes-33}
\myparbox{\Veim{down} is quasi-complete.}
\end{equation}
From
\eqref{eq:silo-causes-30}
and
\eqref{eq:silo-causes-33},
we see that
\Veim{down} is a silo cause
of \Veim{ns}.

\textbf{Reduction EIM}:
Let \Veim{duct} be a quasi-complete reduction EIM,
let its top-down cause be \Veim{down}
and let the EIM equivalent of
its bottom-up cause be \Veim{up}.
By the definition of causes,
we know that
\begin{gather}
\label{eq:silo-causes-36a}
\myparbox{
the bottom-up cause of \Veim{duct} is
a complete EIM,
and is therefore a quasi-complete EIM;
} \\
\label{eq:silo-causes-36c}
\myparbox{
$\Right{\Veim{up}} = \Right{\Veim{duct}}.$
}
\end{gather}
From
\eqref{eq:silo-causes-36a}
and
\eqref{eq:silo-causes-36c},
we see that
\Veim{up}
is
a silo cause of \Veim{duct}.

From Theorem
\ref{t:down-cause-from-effect},
we know that
\begin{align}
\notag
& \Right{\Veim{down}} < \Right{\Veim{duct}} \\
\label{eq:silo-causes-40}
\therefore \quad &  \Right{\Veim{down}} \neq \Right{\Veim{duct}}
\end{align}
\eqref{eq:silo-causes-40} shows that \Veim{down}
cannot be a silo cause of \Veim{duct}.

\textbf{Prediction EIM}:
By Theorem \ref{t:quasi-drs-disjoint},
we see that a prediction is never quasi-complete,
and therefore can never be a silo layer.

\textbf{Start EIM}:
By its definition, the start EIM has a telluric
symbol in its dot suffix,
and therefore is not quasi-complete.
For this reason,
the start EIM is never a silo layer.
\end{proof}

\begin{lemma}
\ttitle{Read EIM silo layer properties}
\label{t:silo-read-eim-layer}
Let a silo layer, call it \Vel{silo}{i}, be a read EIM.
Then
\begin{gather}
\label{eq:silo-read-eim-layer-1}
\var{i} = 0,
\\
\label{eq:silo-read-eim-layer-3}
\Vel{silo}{i} = \Vel{silo}{j} \implies \var{i} = \var{j}.
\end{gather}
\end{lemma}

\begin{proof}
Let \Vel{silo}{x} be a read EIM.
By Theorem
\ref{t:silo-causes},
it has no causes,
and therefore by the definition of
a silo,
there is no silo layer
\Vel{silo}{\Vdecr{x}}.
Our indexing convention is that 0 is
numerically the lowest index of the silo.
This shows
\eqref{eq:silo-read-eim-layer-1}.
\end{proof}

\begin{theorem}
\ttitle{Silo layer telluric prefix}
\label{t:silo-telluric-prefix}
Every layer of a silo at \Vloc{k} has a telluric symbol before
\Vloc{k}.
\end{theorem}

\begin{proof}
A silo layer must be quasi-complete,
and no EIM in Marpa is nulling,
so that there must be a telluric symbol before \Vloc{k}.
\end{proof}

\begin{theorem}
\ttitle{No location 0 silo}
\label{t:no-silo-at-0}
There are no silos at location 0.
\end{theorem}

\begin{proof}
From Theorem \ref{t:silo-telluric-prefix},
there must be a telluric symbol before \Vloc{k}.
Therefore, without loss of generality, a silo layer is
\begin{equation}
\label{eq:no-silo-at-0-10}
\big[ [ \Vsym{A} \de \Vstr{fore} \Vsym{tell} \mydot \Vstr{suffix} ], \Vloc{i}, \Vloc{k} \big]
\end{equation}
for some \Vloc{i},
and some rule
\[
  [ \Vsym{A} \de \Vstr{fore} \Vsym{tell} \Vstr{suffix} ] \in \Crules
\]
where \Vsym{tell} is telluric.
By the definition of EIM validity, we know that
\begin{align}
& \Vmk{i} \Vstr{fore} \Vsym{tell} \Vmk{k} &&
  \text{\eqref{eq:no-silo-at-0-10}}
\notag
\\
\label{eq:no-silo-at-0-16}
\therefore \quad & \var{k} \ge \var{i} + \Vsize{\Vsym{tell}} &&
\\
\label{eq:no-silo-at-0-17}
  & \Vsize{\Vsym{tell}} \ge 1 &&
\text{\Vsym{tell} is telluric}
\intertext{and because parse locations are non-negative integers,}
& \var{i} \ge 0  &&
\notag
\\
\therefore \quad & \var{k} \ge 0 + \Vsize{\Vsym{tell}} &&
\text{\eqref{eq:no-silo-at-0-16}}
\notag
\\
\therefore \quad & \var{k} \ge 0 + 1 &&
\text{\eqref{eq:no-silo-at-0-17}}
\notag
\\
\label{eq:no-silo-at-0-27}
\therefore \quad & \Vloc{k} \ge 1 &&
\end{align}
\eqref{eq:no-silo-at-0-10} was stated without loss of generality,
so that
\eqref{eq:no-silo-at-0-27} shows the theorem.
\end{proof}

\begin{theorem}
\ttitle{Silo layer predot}
\label{t:silo-predot}
Let \Vloc{k} be the location of a silo.
Every layer of the silo has a symbol before \Vloc{k}.
\end{theorem}

\begin{proof}
This theorem follows
directly from Theorem
\ref{t:silo-telluric-prefix}.
\end{proof}

\begin{theorem}
\ttitle{Consecutive silo incomplete EIM's}
\label{t:consecutive-silo-incompletes}
No run of consecutive incomplete silo layers
is longer than \var{c},
where \var{c} is a constant which depends on
the grammar.
\end{theorem}

\begin{proof}
Let \var{slo} be a silo, and
let
\begin{equation}
\label{eq:consecutive-silo-incompletes-5}
\Vel{slo}{x} \; \text{be an incomplete silo layer.}
\end{equation}
Since every silo layer is quasi-complete,
we know that $\Postdot{\Vel{slo}{x}} = \epsilon$,
so that
\begin{align}
\label{eq:consecutive-silo-incompletes-10a}
& \Predot{\el{slo}{\Vincr{x}}} = \epsilon
\\
\label{eq:consecutive-silo-incompletes-10c}
& \text{\el{slo}{\Vincr{x}} is a null-scan
   $\because$ \eqref{eq:consecutive-silo-incompletes-10a}
}
\\
\label{eq:consecutive-silo-incompletes-10e}
& \text{\el{slo}{\var{x}} is top-down cause of
  \el{slo}{\Vincr{x}}
  $\because$ \eqref{eq:consecutive-silo-incompletes-10c},
    \tref{t:silo-causes},
}
\\
&
\begin{multlined}
\el{slo}{\Vincr{x}} = \op{null-scan-op}{\el{slo}{\var{x}}} \\
   \because
    \eqref{eq:consecutive-silo-incompletes-10c},
    \eqref{eq:consecutive-silo-incompletes-10e},
    \; \text{Def of \myfnname{null-scan-op}}
\end{multlined}
\end{align}
In the above, \var{x} was chosen without loss of generality,
so that a sequence of incomplete silo layers is an iterated
sequence of \myfnname{null-scan-op} arguments.
Let the sequence of incomplete silo layers be
$\el{slo}{\var{x} \ldots \var{y}}$
where $\var{y} \ge \var{x}$.
By the definition of a fleeting closure,
\el{slo}{\var{x} \ldots \var{y}} is part of a fleeting closure
whose first element is \Vel{slo}{x}.
\eqref{eq:quasi-complete-fleeting-closure-properties-9}
of Theorem \ref{t:quasi-complete-fleeting-closure-properties}
sets a maximum limit to the size of a fleeting closure whose
first element is a quasi-complete EIM,
so that,
recalling \eqref{eq:consecutive-silo-incompletes-5},
we see that the fleeting closure containing
\el{slo}{\var{x} \ldots \var{y}} has at most
\Vsize{\Rule{\Vel{slo}{x}}} elements.
Therefore,
\el{slo}{\var{x} \ldots \var{y}} has at most
\Vsize{\Rule{\Vel{slo}{x}}} elements.

Let \var{c} be a constant greater than or equal to the length
of the longest rule in the grammar.
Since
the choice of \Vel{slo}{x} and of its rule was without loss
of generality, we know that
$\Vsize{\Rule{\Vel{slo}{x}}} \le \var{c}$
and therefore
\[
  \size{\el{slo}{\var{x} \ldots \var{y}}} \le \var{c}.\qedhere
\]
\end{proof}

\begin{theorem}
\ttitle{Silo size}
\label{t:silo-size}
Let \var{slo} be a silo,
and let
\[
\var{comps} = \big| \lbrace \Veim{eim} | \text{\var{eim} is complete} \rbrace \big|.
\]
The number of layers in a silo is
less than or equal to
$\var{a} \times (\var{comps} + 2)$,
where \var{a} is a constant which depends on
the grammar.
\end{theorem}

\begin{proof}
Every layer in \var{slo} is either a complete EIM
or an incomplete EIM,
so that we can treat \var{slo} as a series of
\Vincr{comps}
runs, each run containing zero or more incomplete EIM's,
with each of the runs
separated by one of the \var{comps} complete EIM's.
From Theorem
\ref{t:consecutive-silo-incompletes},
we know that the maximum length of a run of incomplete EIM's in
a silo is \var{maxrun},
where \var{maxrun} is a constant which depends on the grammar.
Letting $\var{a} = \var{maxrun} + 1$,
\begin{align}
\label{eq:silo-size-10}
\Vsize{\var{slo}} & \le \var{comps} + (\Vincr{comps}) \times \var{maxrun}
\\
\Vsize{\var{slo}} & \le (\var{comps} + 2) \times \var{a}
   \; \because \; \eqref{eq:silo-size-10}\qedhere
\end{align}
\end{proof}

\begin{lemma}
\ltitle{Silo reflection of non-terminals}
\label{lem:silo-reflection-nt}
Let \el{silo}{\Vincr{i}},
\Vel{silo}{i},
be two silo layers.
\begin{multline}
\label{eq:lem-silo-reflection-nt-3}
\text{If \Predot{\el{silo}{\Vincr{i}}} is a non-terminal,}
\\
\text{then
$\op{Valid-eq}{\el{silo}{\Vincr{i}}} \xderives{1} \op{Valid-eq}{\el{silo}{\var{i}}}.$}
\end{multline}
\end{lemma}

\begin{proof}
Without loss of generality, we let
\begin{equation}
\label{eq:lem-silo-reflection-nt-10}
\el{silo}{\Vincr{i}}
= \bigl[ [\Vsym{A} \de \Vstr{pre-B} \Vsym{B} \mydot \Vstr{post-B}], \var{a}, \var{c} \bigr].
\end{equation}
By assumption for
\eqref{eq:lem-silo-reflection-nt-3},
we have that
\begin{equation}
\label{eq:lem-silo-reflection-nt-11}
\text{\Vsym{B} is a non-terminal.}
\end{equation}

Since \Vsym{B} is a non-terminal,
we know from Theorem \ref{t:silo-causes},
that \Vel{silo}{i}, its silo cause,
is its bottom-up cause.
From Theorem \ref{t:symbolic-causes-from-effect}, we know
that the bottom-up cause of
\eqref{eq:lem-silo-reflection-nt-10}
is $\Vmk{b} \Vsym{B} \Vmk{c}$ for some \Vloc{b}.
Since \Vsym{B} is a non-terminal, by
the definition of validity for a non-terminal symbol instance,
we know that
it has an equivalent EIM which is,
without loss of generality,
\begin{equation}
\label{eq:lem-silo-reflection-nt-12}
\Vel{silo}{i} = \bigl[[\Vsym{B} \de \Vstr{B-rhs} \mydot ], \var{b}, \var{c} \bigr].
\end{equation}
The validity equivalent of
\eqref{eq:lem-silo-reflection-nt-10}
is
\begin{equation}
\label{eq:lem-silo-reflection-nt-14}
\Vsym{A} \derives \Vmk{a} \Vstr{pre-B} \Vsym{B} \Vmk{c} \Vstr{post-B},
\end{equation}
and
the validity equivalent of
\eqref{eq:lem-silo-reflection-nt-12}
is
\begin{equation}
\label{eq:lem-silo-reflection-nt-16}
\Vsym{B} \derives \Vmk{b} \Vstr{B-rhs} \Vmk{c}.
\end{equation}
Combining
\eqref{eq:lem-silo-reflection-nt-14}
and
\eqref{eq:lem-silo-reflection-nt-16},
we have
\begin{equation}
\label{eq:lem-silo-reflection-nt-20}
\begin{aligned}
& \Vsym{A}
  && \\
\derives \; & \Vmk{a} \Vstr{pre-B} \Vsym{B} \Vmk{c} \Vstr{post-B}
  && \text{Step \var{s}} \\
\derives \; & \ldots \Vmk{b} \Vstr{B-rhs} \Vmk{c} \ldots
  && \text{Step \Vincr{s}},
\end{aligned}
\end{equation}
where we have added step numbers for convenience,
and without loss of generality.
Recall that our convention is to say that the derivation step of an EIM
layer is the second step of its derivation move,
so that the derivation step for
\eqref{eq:lem-silo-reflection-nt-10} is at
Step \var{s},
and the derivation step for
\eqref{eq:lem-silo-reflection-nt-12} is at
Step \Vincr{s}.
Clearly,
Step \var{s} derives Step \Vincr{s} in one step,
which shows \eqref{eq:lem-silo-reflection-nt-3}.
\end{proof}

\begin{lemma}
\ltitle{Silo reflection of nulling terminal}
\label{lem:silo-reflection-nulling1}
Let \el{silo}{\Vincr{i}},
\Vel{silo}{i},
be two silo layers.
\begin{equation}
\label{eq:lem-silo-reflection-nulling1-6}
\begin{aligned}
\text{If $\op{Valid-eq}{\el{silo}{\Vincr{i}}} \xderives{0} \op{Valid-eq}{\el{silo}{\var{i}}}$},
\\
\qquad \text{then \Predot{\el{silo}{\Vincr{i}}} is a nulling terminal.}
\end{aligned}
\end{equation}
\end{lemma}

\begin{proof}
Without loss of generality, we let
\begin{equation}
\label{eq:lem-silo-reflection-nulling1-10}
\el{silo}{\Vincr{i}}
= \bigl[ [\Vsym{A} \de \Vstr{pre-B} \Vsym{B} \mydot \Vstr{post-B}], \var{a}, \var{c} \bigr].
\end{equation}
The validity equivalent of
\eqref{eq:lem-silo-reflection-nulling1-10}
is
\begin{equation}
\label{eq:lem-silo-reflection-nulling1-10a}
\Vsym{A} \derives \Vmk{a} \Vstr{pre-B} \Vsym{B} \Vmk{c} \Vstr{post-B}.
\end{equation}

We assume
\begin{equation}
\label{eq:lem-silo-reflection-nulling1-11}
\begin{gathered}
\text{\Vsym{B} is a non-terminal} \\
\land \; \op{Valid-eq}{\el{silo}{\Vincr{i}}} \xderives{0} \op{Valid-eq}{\el{silo}{\var{i}}}
\end{gathered}
\end{equation}
for a reductio.
If \Vsym{B} is a non-terminal, by
the definition of validity for a non-terminal symbol instance,
we know that its parse instance has an EIM equivalent,
so that the bottom-up cause
of \eqref{eq:lem-silo-reflection-nulling1-10}
is, without loss of generality,
\begin{equation}
\label{eq:lem-silo-reflection-nulling1-12}
\Vel{silo}{i} = \bigl[[\Vsym{B} \de \Vstr{B-rhs} \mydot ], \var{b}, \var{c} \bigr].
\end{equation}
The validity equivalent
of \eqref{eq:lem-silo-reflection-nulling1-12}
is
\begin{equation}
\label{eq:lem-silo-reflection-nulling1-16}
\Vsym{B} \derives \Vmk{b} \Vstr{B-rhs} \Vmk{c},
\end{equation}
which implies that
\begin{equation}
\label{eq:lem-silo-reflection-nulling1-38}
\text{$[ \Vsym{B} \de \Vstr{B-rhs} ]$ is a rule of \Cg.}
\end{equation}

We now combine
\eqref{eq:lem-silo-reflection-nulling1-10a}
and
\eqref{eq:lem-silo-reflection-nulling1-16}.
In case nulling symbols are significant,
we avoid
the use of location markers or
simplifications.
\begin{align}
\notag
& \Vsym{A} \\
\label{eq:lem-silo-reflection-nulling1-42}
\derives \; & \Vstr{pre-B} \Vsym{B} \Vstr{post-B} \\
\label{eq:lem-silo-reflection-nulling1-44}
\xderives{0} \; & \Vstr{pre-B} \Vstr{B-rhs} \Vstr{post-B}
\end{align}
Notice that the derivation from
\eqref{eq:lem-silo-reflection-nulling1-42}
to
\eqref{eq:lem-silo-reflection-nulling1-44}
takes place in zero steps,
as required by
\eqref{eq:lem-silo-reflection-nulling1-11}.
Following the implications,
\begin{align}
&
\begin{multlined}
\Vstr{pre-B} \Vsym{B} \Vstr{post-B} \\
\xderives{0} \Vstr{pre-B} \Vstr{B-rhs} \Vstr{post-B}
\end{multlined}
&&
\eqref{eq:lem-silo-reflection-nulling1-42},
\eqref{eq:lem-silo-reflection-nulling1-44}
\\
\therefore \quad &
\begin{multlined}
\Vstr{pre-B} \Vsym{B} \Vstr{post-B} \\
= \Vstr{pre-B} \Vstr{B-rhs} \Vstr{post-B}
\end{multlined}
&&
\\
\label{eq:lem-silo-reflection-nulling1-49}
\therefore \quad &
\Vsym{B} = \Vstr{B-rhs}
&&
\\
\label{eq:lem-silo-reflection-nulling1-50}
\therefore \quad &
\text{$[ \Vsym{B} \de \Vsym{B} ]$ is a rule of \Cg.}
&&
\eqref{eq:lem-silo-reflection-nulling1-38},
\eqref{eq:lem-silo-reflection-nulling1-49}
\end{align}
But the rule of
\eqref{eq:lem-silo-reflection-nulling1-50}
is a cycle and cycles are not allowed in Marpa grammars.
This concludes the reductio.
Our assumption for the reductio was
\eqref{eq:lem-silo-reflection-nulling1-11},
so we conclude that
\begin{equation}
\label{eq:lem-silo-reflection-nulling1-52}
\begin{gathered}
\op{Valid-eq}{\el{silo}{\Vincr{i}}} \xderives{0} \op{Valid-eq}{\el{silo}{\var{i}}} \\
\implies \; \text{\Vsym{B} is a terminal.}
\end{gathered}
\end{equation}

\eqref{eq:lem-silo-reflection-nulling1-52}
is close to the theorem, but the theorem requires that
we show that
\Vsym{B} is a \textbf{nulling} terminal.
We assume for a reductio that \Vsym{B} is a telluric
terminal.
From
\eqref{eq:lem-silo-reflection-nulling1-10},
we see, if \Vsym{B}
is a telluric terminal,
\el{silo}{\Vincr{i}} is a read EIM.
But by Theorem
\ref{t:silo-causes},
we know that a read EIM has no causes.
If \el{silo}{\Vincr{i}} has no causes,
by the definition of a silo,
there is no
silo element \Vel{silo}{i}.
But, by assumption
for the lemma,
there is a
silo element \Vel{silo}{i}.
This contradiction shows the reductio,
and we conclude that
\begin{equation}
\label{eq:lem-silo-reflection-nulling1-53}
\begin{gathered}
\op{Valid-eq}{\el{silo}{\Vincr{i}}} \xderives{0} \op{Valid-eq}{\el{silo}{\var{i}}} \\
\implies \; \text{\Vsym{B} is not a telluric terminal.}
\end{gathered}
\end{equation}

From
\eqref{eq:lem-silo-reflection-nulling1-10},
we know that
$\Vsym{B} = \Predot{\el{silo}{\Vincr{i}}}$.
Using
\eqref{eq:lem-silo-reflection-nulling1-52}
and
\eqref{eq:lem-silo-reflection-nulling1-53}
we conclude that
\begin{equation}
\begin{gathered}
\op{Valid-eq}{\el{silo}{\Vincr{i}}} \xderives{0} \op{Valid-eq}{\el{silo}{\var{i}}} \\
\implies \; \text{\Predot{\el{silo}{\Vincr{i}}} is a nulling terminal,}
\end{gathered}
\end{equation}
which is the theorem.
\end{proof}

\begin{lemma}
\ltitle{Silo reflection nulling induction}
\label{lem:silo-reflection-nulling-induction}
\begin{multline}
\label{eq:lem-silo-reflection-nulling-induction-10}
\text{If $\op{Valid-eq}{\Vel{silo}{hi}} \xderives{0} \op{Valid-eq}{\Vel{silo}{lo}}$,} \\
\text{then for all \var{a},} \quad
\var{hi} \ge \var{a} > \var{lo} \implies \Predot{\Vel{silo}{a}} = \epsilon.
\end{multline}
\end{lemma}

\begin{proof}
We proceed in two cases, depending on the relative
values of \var{hi} and \var{lo}.
We take as our first case,
$\var{lo} \ge \var{hi}$.
For this case
\eqref{eq:lem-silo-reflection-nulling-induction-10}
follows vacuously.

The second case remains:
$\var{lo} < \var{hi}$.
For this case
we proceed by induction,
taking as the hypothesis:
\begin{multline}
\label{eq:lem-silo-reflection-nulling-induction-20}
\tag{IND}
\text{If $\op{Valid-eq}{\Vel{silo}{hi}} \xderives{0} \op{Valid-eq}{\Vel{silo}{x}}$,} \\
\text{then for all \var{a},} \quad
\var{hi} \ge \var{a} > \var{x} \implies \Predot{\Vel{silo}{a}} = \epsilon.
\end{multline}
\eqref{eq:lem-silo-reflection-nulling-induction-20}
for $\var{x} = \Vdecr{hi}$
follows from
Lemma \ref{lem:silo-reflection-nulling1},
and we take this as the basis of the induction.

For the step,
we assume
\eqref{eq:lem-silo-reflection-nulling-induction-20}
for $\var{x} = \var{i}$
to show
\eqref{eq:lem-silo-reflection-nulling-induction-20}
for $\var{x} = \Vdecr{i}$.
The assumption for the step is
\begin{multline}
\label{eq:lem-silo-reflection-nulling-induction-30}
\text{If} \quad
\op{Valid-eq}{\Vel{silo}{hi}} \xderives{0} \op{Valid-eq}{\Vel{silo}{i}}
\\
\text{then} \quad
\forall \var{a} : \var{hi} \ge \var{a} > \var{i}
\implies
\text{\Predot{\Vel{silo}{a}} is nulling.}
\end{multline}
Lemma \ref{lem:silo-reflection-nulling1}
shows us that
\begin{multline}
\label{eq:lem-silo-reflection-nulling-induction-33}
\text{if} \quad
\op{Valid-eq}{\Vel{silo}{i}}
\xderives{0}
\op{Valid-eq}{\el{silo}{\Vdecr{i}}}
\\
\shoveleft{
\qquad \text{then \Predot{\Vel{silo}{i}}
is nulling.}
}
\end{multline}
Combining
\eqref{eq:lem-silo-reflection-nulling-induction-30}
and
\eqref{eq:lem-silo-reflection-nulling-induction-33},
we have
\begin{multline}
\label{eq:lem-silo-reflection-nulling-induction-40}
\text{if} \quad
\op{Valid-eq}{\Vel{silo}{hi}} \xderives{0} \op{Valid-eq}{\el{silo}{\Vdecr{i}}}
\\
\shoveleft{
\text{then} \quad
\forall \var{a} : \var{hi} \ge \var{a} > \Vdecr{i}
\implies
\text{\Predot{\Vel{silo}{a}} is nulling.}
}
\end{multline}
\eqref{eq:lem-silo-reflection-nulling-induction-40}
is
\eqref{eq:lem-silo-reflection-nulling-induction-20}
for $\var{x} = \Vdecr{i}$,
which is what we needed to show for the step.
With this we have the induction,
and
the induction shows
\eqref{eq:lem-silo-reflection-nulling-induction-10}
for $\var{lo} < \var{hi}$.
This was our second case, and with it we
have the theorem.
\end{proof}

\begin{lemma}
\ltitle{Silo reflection of predot null}
\label{lem:silo-reflection-nulling}
Let \el{silo}{\Vincr{i}} and
\Vel{silo}{i}
be two silo layers.
Then
\begin{multline*}
\Predot{\el{silo}{\Vincr{i}}} = \epsilon \\
\implies
\op{Valid-eq}{\el{silo}{\Vincr{i}}} \xderives{0} \op{Valid-eq}{\el{silo}{\var{i}}}.
\end{multline*}
\end{lemma}

\begin{proof}
Without loss of generality, we let
\begin{equation}
\label{eq:lem-silo-reflection-nulling-10}
\el{silo}{\Vincr{i}} = \bigl[ [\Vsym{A} \de \Vstr{pre-B} \Vsym{B} \mydot \Vstr{post-B}], \var{a}, \var{c} \bigr],
\end{equation}
where, by assumption for the theorem,
\Vsym{B} is nulling.

Since \Vsym{B} is nulling,
we know from Theorem \ref{t:silo-causes},
that \Vel{silo}{i}, its silo cause,
is its top-down cause.
\el{silo}{\Vincr{i}} is confirmed
\eqref{eq:lem-silo-reflection-nulling-10},
so that by
\dref[causes of confirmed EIM]{def:causes-confirmed},
we know that
the top-down cause of
\eqref{eq:lem-silo-reflection-nulling-10}
is
\begin{equation}
\label{eq:lem-silo-reflection-nulling-12}
\el{silo}{\var{i}} = \bigl[ [\Vsym{A} \de \Vstr{pre-B} \mydot \Vsym{B} \Vstr{post-B}], \var{a}, \var{c} \bigr].
\end{equation}
The validity equivalent of
\eqref{eq:lem-silo-reflection-nulling-10}
is
\begin{equation}
\label{eq:lem-silo-reflection-nulling-14}
\op{Valid-eq}{\el{silo}{\Vincr{i}}} =
\Vsym{A} \derives \Vmk{a} \Vstr{pre-B} \Vsym{B} \Vmk{c} \Vstr{post-B},
\end{equation}
and
the validity equivalent of
\eqref{eq:lem-silo-reflection-nulling-12}
is
\begin{equation}
\label{eq:lem-silo-reflection-nulling-16}
\op{Valid-eq}{\el{silo}{\var{i}}} =
\Vsym{A} \derives \Vmk{a} \Vstr{pre-B} \Vmk{c} \Vsym{B} \Vstr{post-B}.
\end{equation}
But since $\Vsym{B} \derives \epsilon$, we know that both
\eqref{eq:lem-silo-reflection-nulling-14}
and \eqref{eq:lem-silo-reflection-nulling-16}
are equivalent to
\begin{equation}
\label{eq:lem-silo-reflection-nulling-19}
\Vsym{A} \derives \Vmk{a} \Vstr{pre-B} \Vmk{c} \Vsym{B} \Vmk{c} \Vstr{post-B},
\end{equation}
so that
\begin{equation}
\op{Valid-eq}{\el{silo}{\Vincr{i}}} \xderives{0}
\op{Valid-eq}{\el{silo}{\var{i}}}.
\qedhere
\end{equation}
\end{proof}

We next show that, for every silo,
there is a derivation which
\mbox{``reflects''} % do not hyphenate
it.

\begin{theorem}
\ttitle{Silo reflection}
\label{t:silo-reflection}
Let \el{silo}{\var{hi}} and
\Vel{silo}{lo}
be two silo layers,
such that $\var{hi} \ge \var{lo}$.
Then
\begin{equation}
\op{Valid-eq}{\Vel{silo}{hi}} \destar
\op{Valid-eq}{\Vel{silo}{lo}}.
\end{equation}
\end{theorem}

\begin{proof}
The proof is by induction, where the induction
hypothesis is
\begin{equation}
\tag{IND}
\label{eq:silo-reflection-10}
\op{Valid-eq}{\Vel{silo}{hi}} \destar
\op{Valid-eq}{\Vel{silo}{x}}.
\end{equation}
The validity equivalent of any silo layer derives itself,
so we have
\eqref{eq:silo-reflection-10} for
$\var{x} = \var{hi}$ trivially.
We take this as the basis of our induction.

For the step of the induction we assume
\eqref{eq:silo-reflection-10}
for $\var{x} = \var{i}$ to show
\eqref{eq:silo-reflection-10}
for $\var{x} = \Vdecr{i}$.
The assumption for the step is
\begin{equation}
\tag{STEP}
\label{eq:silo-reflection-20}
\op{Valid-eq}{\Vel{silo}{hi}} \destar
\op{Valid-eq}{\Vel{silo}{i}}.
\end{equation}
By Theorem
\ref{t:silo-predot},
we know that every layer of \var{silo} has a predot symbol.
We show the step by cases, according to whether the predot symbol
of \Vel{silo}{i} is
a telluric terminal,
a nulling terminal,
or a non-terminal.

\textbf{Telluric terminal}:
We first consider the case
where
\begin{equation*}
\text{\Predot{\Vel{silo}{i}} is a telluric terminal}.
\end{equation*}
By Theorem \ref{t:silo-causes},
a silo layer with a telluric terminal predot symbol
has no silo causes.
Therefore there is no \el{silo}{\Vdecr{i}}.
This gives us
\eqref{eq:silo-reflection-10} for \Vdecr{i}
vacuously for the case of a telluric terminal.

\textbf{Nulling terminal}:
We next consider the case where
\begin{equation}
\label{eq:silo-reflection-17}
\Predot{\Vel{silo}{i}} = \epsilon.
\end{equation}
From
\eqref{eq:silo-reflection-17}
and Lemma \ref{lem:silo-reflection-nulling}, we know that
\begin{equation}
\label{eq:silo-reflection-22}
\op{Valid-eq}{\Vel{silo}{i}}
\xderives{0}
\op{Valid-eq}{\el{silo}{\Vdecr{i}}}.
\end{equation}
Combining
\eqref{eq:silo-reflection-20}
and
\eqref{eq:silo-reflection-22},
we have
\begin{equation}
\label{eq:silo-reflection-24}
\op{Valid-eq}{\Vel{silo}{hi}} \destar
\op{Valid-eq}{\el{silo}{\Vdecr{i}}}.
\end{equation}
\eqref{eq:silo-reflection-24} is
\eqref{eq:silo-reflection-10} for \Vdecr{i},
giving us the case of a nulling terminal.

\textbf{Non-terminal}:
We now consider the case where
\begin{equation}
\label{eq:silo-reflection-37}
\text{\Predot{\Vel{silo}{i}} is a non-terminal}.
\end{equation}
From
\eqref{eq:silo-reflection-37}
and Lemma \ref{lem:silo-reflection-nt}, we know that
\begin{equation}
\label{eq:silo-reflection-42}
\op{Valid-eq}{\Vel{silo}{i}}
\xderives{1}
\op{Valid-eq}{\el{silo}{\Vdecr{i}}}.
\end{equation}
Combining
\eqref{eq:silo-reflection-20}
and
\eqref{eq:silo-reflection-42},
we have
\begin{equation}
\label{eq:silo-reflection-44}
\op{Valid-eq}{\Vel{silo}{hi}} \destar
\op{Valid-eq}{\el{silo}{\Vdecr{i}}}.
\end{equation}
\eqref{eq:silo-reflection-44} is
\eqref{eq:silo-reflection-10} for \Vdecr{i},
giving us the case of a non-terminal.
This gives us the last of our three cases,
the step of the induction,
and the theorem.
\end{proof}

\begin{theorem}
\ttitle{Silo layer is unique}
\label{t:silo-layer-unique}
No layer of a silo occurs twice.
That is, if \var{silo} is a silo,
\begin{equation}
\forall \; \var{i}, \var{j} : \Vel{silo}{i} = \Vel{silo}{j} \implies \var{i} = \var{j}.
\end{equation}
\end{theorem}

\begin{proof}
Let \var{silo}
be a silo,
and let \var{hi} and \var{lo}
be the indices of two layers in it.
Without loss of generality,
let $\var{hi} \ge \var{lo}$.
We assume for a reductio that
\begin{equation}
\tag{RAA}
\label{eq:silo-layer-unique-10}
\text{$\Vel{silo}{hi} = \Vel{silo}{lo}$ and $\var{hi} \neq \var{lo}$}
\end{equation}
From Theorem
\ref{t:silo-reflection},
we know that
\begin{equation}
\label{eq:silo-layer-unique-20}
\op{Valid-eq}{\Vel{silo}{hi}} \destar
\op{Valid-eq}{\Vel{silo}{lo}}.
\end{equation}
Within the reductio,
we proceed by cases: trivial derivations,
and non-trivial derivations.

\textbf{Trivial derivation}:
We assume for an inner reductio that
\begin{equation}
\tag{RAA1}
\label{eq:silo-layer-unique-30}
\op{Valid-eq}{\Vel{silo}{hi}} \xderives{0}
\op{Valid-eq}{\Vel{silo}{lo}}
\end{equation}

From
\eqref{eq:silo-layer-unique-30}
and
Lemma
\ref{lem:silo-reflection-nulling-induction},
we have
\begin{align}
\label{eq:silo-layer-unique-40}
& \Predot{\Vel{silo}{hi}} = \epsilon
&&
\\
\label{eq:silo-layer-unique-43}
& \begin{multlined}
\text{silo cause of \Vel{silo}{hi}} \\
\text{is top-down cause}
\end{multlined}
&& \text{Th \ref{t:silo-causes}},
\eqref{eq:silo-layer-unique-40}
\\
\label{eq:silo-layer-unique-46}
&
\begin{multlined}
\Vel{silo}{hi} = \\
  \big[ [ \Vrule{r}, \var{ix} ], \Vorig{hi}, \Vloc{here} \big]
\end{multlined}
&&
\text{WLOG}
\intertext{Note
  that in \eqref{eq:silo-layer-unique-46}, we are using our alternate notation
  for dotted rules, where a dotted rule is a duple of rule and RHS index.
  From \eqref{eq:silo-layer-unique-40}, \eqref{eq:silo-layer-unique-46}
  and the definition of top-down
  cause for a null-scan, we have
}
\label{eq:silo-layer-unique-49}
& \begin{multlined}
\text{top-down cause of \Vel{silo}{hi} is} \\
\big[ [ \Vrule{r}, \Vdecr{ix} ], \Vorig{hi}, \Vloc{here} \big]
\end{multlined}
&&
\end{align}
For this proof, let
\[
\myfn{TDC}{\Veim{eim}} \defined
\begin{cases}
\begin{aligned}
\text{the top-down cause of \Veim{eim},} \\
\text{if $\Predot{\Veim{eim}} = \epsilon$,}
\end{aligned} \\
\undefined, \quad \text{otherwise}
\end{cases}
\]
From this definition of \myfnname{TDC},
\eqref{eq:silo-layer-unique-43}
and \eqref{eq:silo-layer-unique-49},
we have
\begin{multline}
\label{eq:silo-layer-unique-55}
\Predot{\Vel{silo}{hi}} = \epsilon  \\
\implies
\left(
\begin{gathered}
\el{silo}{\Vdecr{hi}} = \myfn{TDC}{\Vel{silo}{hi}} \\
= \big[ [ \Vrule{r}, \Vdecr{ix} ], \Vorig{hi}, \Vloc{here} \big]
\end{gathered}
\right)
\end{multline}

By iteration of
\eqref{eq:silo-layer-unique-55},
we have
\begin{multline}
\label{eq:silo-layer-unique-58}
\text{if} \quad
\forall \var{a} :
\var{hi} \ge \var{a} > \var{lo} \implies
\Predot{\Vel{silo}{a}} = \epsilon, \\
\text{then} \quad
\Vel{silo}{lo} =
\myfnname{TDC}^{\displaystyle (\xxsubtract{\var{hi}}{\var{lo}})}(\Vel{silo}{hi}) = \\
\big[ [ \Vrule{r},
\xxsubtract{\var{ix}}{
  (\xxsubtract{\var{hi}}{\var{lo}})
}
], \Vorig{hi}, \Vloc{here} \big]
\end{multline}

From Lemma
\ref{lem:silo-reflection-nulling-induction}
and
\eqref{eq:silo-layer-unique-30}
we have
\begin{equation}
\label{eq:silo-layer-unique-61}
\forall \var{a} :
\var{hi} \ge \var{a} > \var{lo} \implies
\Predot{\Vel{silo}{a}} = \epsilon,
\end{equation}
so that we can rewrite
\eqref{eq:silo-layer-unique-58}
as
\begin{multline}
\label{eq:silo-layer-unique-64}
\Vel{silo}{lo} =
\myfnname{TDC}^{\displaystyle (\xxsubtract{\var{hi}}{\var{lo}})}(\Vel{silo}{hi}) = \\
\big[ [ \Vrule{r},
\xxsubtract{\var{ix}}{
  (\xxsubtract{\var{hi}}{\var{lo}})
}
], \Vorig{hi}, \Vloc{here} \big].
\end{multline}

From
\eqref{eq:silo-layer-unique-46}
and
\eqref{eq:silo-layer-unique-64},
we have
\begin{equation}
\label{eq:silo-layer-unique-70}
\Vel{silo}{hi} = \Vel{silo}{lo} \implies \var{hi} = \var{lo}.
\end{equation}

\eqref{eq:silo-layer-unique-70}
contradicts
\eqref{eq:silo-layer-unique-10},
our assumption for the outer reductio.
This shows the inner reductio
and the case of trivial derivations.

\textbf{Non-trivial derivations}:
We next consider the case of non-trivial derivations:
\begin{equation}
\label{eq:silo-layer-unique-76}
\op{Valid-eq}{\Vel{silo}{hi}} \deplus
\op{Valid-eq}{\Vel{silo}{lo}}
\end{equation}

From \eqref{eq:silo-layer-unique-10},
we have that
$\Vel{silo}{hi} = \Vel{silo}{lo}.$
Without loss of generality, let
both
\Vel{silo}{hi} and \Vel{silo}{lo}
be
\begin{equation}
\label{eq:silo-layer-unique-85}
\big[ [ \Vsym{A} \de \Vstr{pre} \mydot \Vstr{post} ], \var{i}, \var{k} \big].
\end{equation}
so that their validity equivalents are
\begin{equation}
\label{eq:silo-layer-unique-88}
\Vsym{A} \derives \Vmk{i} \Vstr{pre} \Vmk{k} \Vstr{post}
\end{equation}

The dotted rule in a silo layer must be quasi-complete,
so that $\Vstr{post} = \epsilon$.
Therefore we can use
\eqref{eq:silo-layer-unique-88}
to write
\eqref{eq:silo-layer-unique-76}
as
\begin{equation}
\begin{aligned}
\label{eq:silo-layer-unique-93}
\Vmk{i} \Vsym{A} \Vmk{k} \derives & \; \Vmk{i} \Vstr{pre} \Vmk{k} \\
  \destar & \; \Vmk{i} \Vsym{A} \Vmk{k} \\
  \derives & \; \Vmk{i} \Vstr{pre} \Vmk{k}
\end{aligned}
\end{equation}
From
\eqref{eq:silo-layer-unique-93}
we have
\begin{gather}
\label{eq:silo-layer-unique-95a}
\Vmk{i} \Vsym{A} \Vmk{k} \deplus \Vmk{i} \Vsym{A} \Vmk{k} \\
\label{eq:silo-layer-unique-95b}
\text{and} \quad
 \Vmk{i} \Vstr{pre} \Vmk{k} \deplus \Vmk{i} \Vstr{pre} \Vmk{k}
\end{gather}
Using Theorem
\ref{t:location-marker-cycle},
we see that both
\eqref{eq:silo-layer-unique-95a}
and
\eqref{eq:silo-layer-unique-95b}
are cycles,
which are not
allowed in a Marpa grammar.
This contradicts
\eqref{eq:silo-layer-unique-10},
and shows the reductio for non-trivial
derivations.

We have already shown
the reductio for trivial
derivations.
We now have
both cases,
the reductio
and therefore, the theorem.
\end{proof}

\begin{theorem}
\ttitle{Silos are finite}
\label{t:silo-finite}
Every silo is of finite height.
\end{theorem}

\begin{proof}
By Theorem
\ref{t:es-count}, the number of Earley items
with a single right location is finite.
By Theorem
\ref{t:silo-location},
all the layers of a silo share the same right location.
So either a silo has finite length, or the same layer
occurs more than once in a silo.
But, by Theorem
\ref{t:silo-layer-unique},
no silo layer occurs
more than once in a silo.
\end{proof}

\begin{theorem}
\ttitle{Grounded silo}
\label{t:grounded-silo}
Every silo is part of
a silo of finite length,
whose bottom is a read EIM.
\end{theorem}

\begin{proof}
Let \var{slo} be a silo.
Let \var{sloset}
be the set of all silos of which \var{slo} is a part.
\var{sloset} has at least one element
--- \var{slo} itself.
By Theorem
\ref{t:silo-finite}
all of these silos in \var{sloset} have a finite length,
so there is a finite maximum length for the silos
in \var{sloset}.
Call this length \var{maxl}.
There will be at least one silo,
call it \var{gslo},
such that
$\var{gslo} \in \var{sloset}$
and the length of \var{gslo} is \var{maxl}.

Assume, for a reductio,
that $\Veim{bot} = \el{gslo}{0}$
is not a read EIM.
Since it is not a read EIM,
by Theorem \ref{t:silo-causes},
\Veim{bot} has a silo cause.
Therefore
a silo layer could be added below \Veim{bot}.
But if a silo layer could be added below \Veim{bot},
then \Veim{bot} is not at the bottom of a silo
of maximum length,
which is contrary to assumption for \var{gslo}.
Since there was at least one silo \var{gslo} that satisfied
the assumptions for \var{gslo},
we conclude that \Veim{bot} is a read EIM.
\end{proof}

\begin{theorem}
\ttitle{EIM grounded silo}
\label{t:eim-grounded-silo}
Every quasi-confirmed EIM has
a silo of finite length,
whose bottom is a read EIM.
\end{theorem}

\begin{proof}
Let \Veim{quasi} be a quasi-confirmed EIM.
By the definition of silo,
the sequence consisting only of
\Veim{quasi} is a silo.
This theorem follows from this
observation
and
Theorem
\ref{t:grounded-silo}.
\end{proof}

\begin{definition}
\dtitle{Fleeting closure silo}
\label{def:fleeting-closure-silo}
\var{slo} is
the \dfn{fleeting closure silo}
of \Veim{qc}
if and only if
these two conditions hold:
\begin{itemize}
\item
\Veim{qc} is quasi-complete,
\item
\var{slo} is the fleeting closure of \Veim{qc}.
\end{itemize}
\end{definition}

\begin{theorem}
\ttitle{Fleeting closure silo properties}
\label{t:fleeting-closure-silo-props}
Assume that
\begin{subequations}
\renewcommand{\theequation}{A\arabic{equation}}
\begin{equation}
\label{eq:fleeting-closure-silo-prop-asm-1}
\myparbox{%
\var{slo} is the fleeting closure silo of
\Veim{qc}.
}
\end{equation}
\end{subequations}

Under that assumption,
we have

TODO

\begin{subequations}
\renewcommand{\theequation}{R\arabic{equation}}
\begin{align}
\label{eq:fleeting-closure-silo-prop-req-1}
& \myparbox{%
$\var{slo} = \op{fleeting-closure}{\Veim{qc}}$
\becuz{}
\eqref{eq:fleeting-closure-silo-prop-asm-1},
\dref[fleeting closure silo]{def:fleeting-closure-silo}
}
\\
\label{eq:fleeting-closure-silo-prop-req-3}
& \el{slo}{0} = \Veim{qc}.
\\
\label{eq:fleeting-closure-silo-prop-req-5}
& \text{\var{slo} contains at least one layer.}
\\
\label{eq:fleeting-closure-silo-prop-req-9}
& \text{\var{slo} contains at most \Vsize{\Rule{\el{slo}{0}}}
  layers
}
\\
\label{eq:fleeting-closure-silo-prop-req-10}
& \text{$\var{slo}\big[ \Vlastix{slo} \big]$
  is a complete EIM.
}
\\
\label{eq:fleeting-closure-silo-prop-req-12}
& \begin{aligned}
& \forall \var{a} : 0 \le \var{a} < \Vlastix{slo} \\
& \quad \implies \text{\Vel{slo}{a} is an incomplete EIM}
\end{aligned}
\\
\label{eq:fleeting-closure-silo-prop-req-13}
& \begin{aligned}
& \forall \var{a} : 0 \le \var{a} \le \Vlastix{slo} \\
& \quad \implies \text{\Vel{slo}{a} is a quasi-complete EIM}
\end{aligned}
\\
\label{eq:fleeting-closure-silo-prop-req-14}
& \begin{aligned}
& \forall \var{a} : 0 \le \var{a} \le \Vlastix{slo}
  \implies \Valid{\Vel{slo}{a}}
\end{aligned}
\\
\label{eq:fleeting-closure-silo-prop-req-16}
& \begin{aligned}
& \forall \var{a} : 0 \le \var{a} \le \Vlastix{slo} \\
& \qquad \implies \op{Right}{\el{slo}{0}} = \op{Right}{\Vel{slo}{a}}
\end{aligned}
\\
\label{eq:fleeting-closure-silo-prop-req-18}
& \begin{aligned}
& \forall \var{a} : 0 \le \var{a} \le \Vlastix{slo} \\
& \qquad \implies \op{Rule}{\el{slo}{0}} = \op{Rule}{\Vel{slo}{a}}
\end{aligned}
\\
\label{eq:fleeting-closure-silo-prop-req-20}
& \begin{aligned}
& \forall \var{a} : 0 \le \var{a} \le \decr{\Vlastix{slo}} \\
& \qquad \implies \text{\Vel{slo}{a} is the unique
  top-down cause of \el{slo}{\Vincr{a}}
}
\end{aligned}
\\
\label{eq:fleeting-closure-silo-prop-req-21}
& \begin{aligned}
& \forall \var{a} : 0 \le \var{a} \le \decr{\Vlastix{slo}} \\
& \qquad \implies \text{\Vel{slo}{a} is
  the unique silo cause of \el{slo}{\Vincr{a}}
}
\end{aligned}
\\
\label{eq:fleeting-closure-silo-prop-req-22}
& \begin{aligned}
& \forall \var{a} : 0 \le \var{a} \le \decr{\Vlastix{slo}} \\
& \qquad \implies \text{\el{slo}{\Vincr{a}}
  is the unique effect of \Vel{slo}{a}
}
\end{aligned}
\end{align}
\end{subequations}

\end{theorem}

\begin{proof}
\eqref{eq:fleeting-closure-silo-5}
follows from
\begin{itemize}
\item
the assumption for the theorem that \el{slo}{0} is quasi-complete;
\item
\eqref{eq:quasi-complete-fleeting-closure-properties-13},
\eqref{eq:quasi-complete-fleeting-closure-properties-16}
and
\eqref{eq:quasi-complete-fleeting-closure-properties-20}
of Theorem
\ref{t:quasi-complete-fleeting-closure-properties};
and
\item
the definition of a silo.
\end{itemize}

For the fleeting closure silo properties,
\begin{itemize}
\item
Property
\eqref{eq:fleeting-closure-silo-prop-req-5}
follows from
\eqref{eq:fleeting-closure-silo-5};
\item
Property
\eqref{eq:fleeting-closure-silo-prop-req-9}
follows from
\eqref{eq:quasi-complete-fleeting-closure-properties-9}
of Theorem
\ref{t:quasi-complete-fleeting-closure-properties};
\item
Property
\eqref{eq:fleeting-closure-silo-prop-req-10}
follows from
\eqref{eq:quasi-complete-fleeting-closure-properties-10}
of Theorem
\ref{t:quasi-complete-fleeting-closure-properties};
\item
Property
\eqref{eq:fleeting-closure-silo-prop-req-12}
follows from
\eqref{eq:quasi-complete-fleeting-closure-properties-12}
of Theorem
\ref{t:quasi-complete-fleeting-closure-properties};
\item
Property
\eqref{eq:fleeting-closure-silo-prop-req-13}
follows from
\eqref{eq:quasi-complete-fleeting-closure-properties-13}
of Theorem
\ref{t:quasi-complete-fleeting-closure-properties};
\item
Property
\eqref{eq:fleeting-closure-silo-prop-req-14}
follows from
\eqref{eq:quasi-complete-fleeting-closure-properties-14}
of Theorem
\ref{t:quasi-complete-fleeting-closure-properties};
\item
Property
\eqref{eq:fleeting-closure-silo-prop-req-16}
follows from
\eqref{eq:quasi-complete-fleeting-closure-properties-16}
of Theorem
\ref{t:quasi-complete-fleeting-closure-properties};
\item
Property
\eqref{eq:fleeting-closure-silo-prop-req-18}
follows from
\eqref{eq:quasi-complete-fleeting-closure-properties-18}
of Theorem
\ref{t:quasi-complete-fleeting-closure-properties};
\item
Property
\eqref{eq:fleeting-closure-silo-prop-req-20}
follows from
\eqref{eq:quasi-complete-fleeting-closure-properties-20}
of Theorem
\ref{t:quasi-complete-fleeting-closure-properties};
\item
Property
\eqref{eq:fleeting-closure-silo-prop-req-21} follows from
\eqref{eq:fleeting-closure-silo-prop-req-13},
\eqref{eq:fleeting-closure-silo-prop-req-16}
and
\eqref{eq:fleeting-closure-silo-prop-req-20};
\item
Property
\eqref{eq:fleeting-closure-silo-prop-req-22}
follows from
\eqref{eq:quasi-complete-fleeting-closure-properties-22}
of Theorem
\ref{t:quasi-complete-fleeting-closure-properties}.
\qedhere
\end{itemize}
\end{proof}

\begin{definition}
\dtitle{Completion of a fleeting closure silo}

TODO: Eliminate all references to "completion" of a silo?
Or revise?

If \var{fcs} is a fleeting closure silo,
we say that \el{fcs}{\Vlastix{fcs}}
is the
\xdfn{completion}{completion@completion (EIM)!of a fleeting closure silo}
of \var{fcs}.
\end{definition}

\begin{definition}
\dtitle{Maximal silo}
A
\dfn{maximal silo}
is a silo whose bottom layer has no silo cause,
and whose top layer has no silo effect.
\end{definition}

We sometimes write \Maximal{\var{slo}}%
\index{recce-notation}{Maximal(slo)@\Maximal{\var{slo}}}
to say that the silo \var{slo} is maximal.

\begin{theorem}
\ttitle{Maximal fleeting closure silo}
\label{t:maximal-fleeting-closure-silo}
Let \Veim{qc} be a valid quasi-complete EIM,
and let \Veim{bas} be its lasting base.
Then there is a silo, call it \var{slo},
such that
\begin{equation}
\notag
\el{slo}{0} = \Veim{bas}
\end{equation}
and \var{slo} is a
fleeting closure silo.
\end{theorem}

\begin{proof}
By assumption for the theorem,
\Veim{bas} is the lasting base of \Veim{qc}.
By Theorem \ref{t:eim-lasting-base}, \Veim{qc}
has a valid lasting base:
\begin{equation}
\label{eq:maximal-fleeting-closure-silo-10}
\Valid{\Veim{bas}}.
\end{equation}
By assumption for the theorem, \Veim{qc}
is quasi-complete,
so that, by the definition
of quasi-complete, all the symbols
in the dot suffix of \Veim{qc}
are nulling.
By the definition of a lasting base,
all of the symbols between
\Dotix{\Veim{bas}}
and
\Dotix{\Veim{qc}}
are nulling.
Therefore all of the symbols in the dot
suffix of \Veim{bas} are nulling,
so that, by the definition of quasi-complete,
\begin{equation}
\label{eq:maximal-fleeting-closure-silo-15}
\text{\Veim{bas} is quasi-complete.}
\end{equation}
This theorem follows from
\eqref{eq:maximal-fleeting-closure-silo-10},
\eqref{eq:maximal-fleeting-closure-silo-15}
and Theorem
\ref{t:fleeting-closure-silo}.
\end{proof}

\begin{theorem}
\ttitle{Maximal silo}
\label{t:maximal-silo}
Every silo is part of
at least one finite maximal silo,
whose bottom is a read EIM.
\end{theorem}

\begin{proof}
Let \var{slo0} be a silo.
We create \var{maxslo}, a maximal silo,
from \var{slo0}
using the following construction:
\begin{itemize}
\item
\textbf{Step 1}:
By Theorem
\ref{t:grounded-silo},
\var{slo0} is part of at least one finite silo
whose bottom is a read EIM.
Initially, let \var{workslo} be one of these silos.
\item
\textbf{Step 2}: If \el{workslo}{\Vlastix{workslo}} has no silo effect,
then let $\var{maxslo} \gets \var{workslo}$,
and terminate the construction.
\item
\textbf{Step 3}:
Let \Veim{newlayer} be the silo effect of
\el{workslo}{\Vlastix{workslo}}.
Let \var{newslo} be
\var{workslo} with \Veim{newlayer} appended,
that is
\begin{equation}
\notag
\Vel{newslo}{i} =
\begin{cases}
\text{\Vel{workslo}{i},
if $0 \le \var{i} \le \Vlastix{workslo}$}
\\
\text{\Veim{newlayer}, if
$\var{i} = \Vincr{\Vlastix{workslo}}$}
\end{cases}
\end{equation}
\item
\textbf{Step 4}:
Let $\var{workslo} \gets \var{newslo}$,
and go to Step 2.
\end{itemize}
This construction either creates a \var{maxslo} whose top
element has no silo effect,
or it constructs a silo of infinite size.
Since
by Theorem \ref{t:silo-finite},
we know that all silos are finite,
we can conclude that there is a \el{maxslo}{\Vlastix{maxslo}},
and that it has no silo effect.

Throughout the construction, \el{workslo}{0}
remains constant.
The construction initialized
\el{workslo}{0} to a read EIM.
Read EIM's,
by Theorem \ref{t:silo-causes},
have no silo cause.
Once the construction is complete,
$\el{maxslo}{0} = \el{workslo}{0}$,
and therefore
\el{maxslo}{0} has no silo cause.
\end{proof}

\begin{theorem}
\ttitle{EIM maximal silo}
\label{t:eim-maximal-silo}
Every quasi-complete EIM
is in at least one finite maximal silo,
whose bottom is a read EIM.
\end{theorem}

\begin{proof}
Let \Veim{qc} be a valid quasi-complete EIM.
By the definition of silo,
the sequence consisting only of
\Veim{qc} is a silo.
This theorem follows from this observation,
and Theorem \ref{t:maximal-silo}.
\end{proof}

\begin{theorem}
\ttitle{Maximal silo bottom is read EIM}
The bottom of every maximal silo is
a read EIM.
\end{theorem}

\begin{proof}
By Theorem \ref{t:silo-finite},
we know that all silos are finite,
so that every maximal silo has a bottom EIM.
By definition of a maximal silo,
its bottom layer has no silo cause.
By Theorem \ref{t:silo-causes},
the only silo layers without
silo causes are read EIM's.
\end{proof}

\begin{theorem}
\ttitle{Maximal silo top is complete}
\label{maximal-silo-top-is-complete}
The top of every maximal silo is
a complete EIM.
\end{theorem}

\begin{proof}
Let \var{mslo} be a maximal silo.
By Theorem \ref{t:silo-finite},
we know that all silos are finite,
so that \var{mslo} has a top EIM.
\begin{align}
\label{maximal-silo-top-is-complete-10}
& \text{\Veim{top} = \el{mslo}{\Vlastix{mslo}}: WLOG}
\\
\label{maximal-silo-top-is-complete-12}
& \text{\Veim{top} is incomplete: ASM for a reductio}
\\
\label{maximal-silo-top-is-complete-20}
& \text{\Veim{top} is a silo layer}:
\eqref{maximal-silo-top-is-complete-10}
\\
\label{maximal-silo-top-is-complete-13}
& \text{$\Veim{top} \in \var{fc}$,
where \var{fc}
is fleeting closure:
Th \ref{t:eim-lasting-base},
WLOG
}
\\
\label{maximal-silo-top-is-complete-15}
& \text{\Veim{top} is quasi-complete:
\eqref{maximal-silo-top-is-complete-20},
Def of silo
}
\\
\label{maximal-silo-top-is-complete-23}
& \text{\el{fc}{\Vlastix{fc}} is complete:
\eqref{maximal-silo-top-is-complete-15},
\eqref{eq:quasi-complete-fleeting-closure-properties-10}
of
Th \ref{t:quasi-complete-fleeting-closure-properties}
}
\\
\label{maximal-silo-top-is-complete-26}
& \el{fc}{\Vlastix{fc}} \neq \Veim{top}: \;
\eqref{maximal-silo-top-is-complete-12},
\eqref{maximal-silo-top-is-complete-23}
\\
\label{maximal-silo-top-is-complete-28}
& \text{\Veim{top} has a silo effect:
\eqref{maximal-silo-top-is-complete-13},
\eqref{maximal-silo-top-is-complete-26},
\eqref{eq:quasi-complete-fleeting-closure-properties-22} of
Th \ref{t:quasi-complete-fleeting-closure-properties}
}
\\
\label{maximal-silo-top-is-complete-30}
& \Veim{top} \neq \el{mslo}{\Vlastix{mslo}}:
\eqref{maximal-silo-top-is-complete-28},
\; \text{Def of maximal silo}
\end{align}
\eqref{maximal-silo-top-is-complete-10}
contradicts
\eqref{maximal-silo-top-is-complete-30},
which gives us the reductio that began at
\eqref{maximal-silo-top-is-complete-12}.
From the reductio we conclude that \Veim{top}
is complete.
\end{proof}

\begin{theorem}
\ttitle{Maximal fleeting silo in maximal silo}
\label{t:maximal-fleeting-silo-in-maximal-silo}
Let \var{mslo} be a maximal silo.
Let \Veim{eim} be an EIM,
such that $\Veim{eim} \in \var{mslo}$.
Let \var{mfc} be the maximal fleeting closure of
\Veim{eim}.
Then $\var{mfc} \subseteq \var{mslo}$.
\end{theorem}

\begin{proof}
By assumption for the theorem,
\Veim{eim} is in a maximal silo,
so that \Veim{eim} must be quasi-complete.
Recall that the fleeting closure is defined in terms of
\myfnname{null-scan-op},
which we have shown to be a function with an inverse.
If
\[
\begin{gathered}
\Veim{cuz} \neq \undefined
\land \; \Veim{eff} \neq \undefined \\
\land \;  \Vop{null-scan-op}{\Veim{cuz}} = \Veim{eff},
\end{gathered}
\]
we have,
from Theorem \ref{t:null-scan-from-down-cause},
\begin{gather}
\label{eq:maximal-fleeting-silo-in-maximal-silo-4}
\myparbox{$\Right{\Veim{cuz}} = \Right{\Veim{eff}}$;} \\
\label{eq:maximal-fleeting-silo-in-maximal-silo-5}
\myparbox{\Veim{cuz} is quasi-complete
if and only if
\Veim{eff} is quasi-complete; and
} \\
\label{eq:maximal-fleeting-silo-in-maximal-silo-6}
\myparbox{\Veim{cuz} is the top-down cause of \Veim{eff}}.
\end{gather}
It follows
from
\eqref{eq:maximal-fleeting-silo-in-maximal-silo-4},
\eqref{eq:maximal-fleeting-silo-in-maximal-silo-5},
\eqref{eq:maximal-fleeting-silo-in-maximal-silo-6}
and the definition of silo that
\begin{gather}
\label{eq:maximal-fleeting-silo-in-maximal-silo-10}
\myparbox{
if \Veim{cuz} is quasi-complete, \Veim{eff} is its
silo effect, and
} \\
\label{eq:maximal-fleeting-silo-in-maximal-silo-12}
\myparbox{
if \Veim{eff} is quasi-complete, \Veim{cuz} is its
silo cause.
}
\end{gather}

We proceed by two inductions, a forward
induction on the effects
of \Veim{eim},
and a reverse induction on the causes of \Veim{eim}.
We take as the induction hypothesis for both inductions
\begin{equation}
\tag{IND}
\label{eq:maximal-fleeting-silo-in-maximal-silo-20}
\begin{gathered}
\text{\Veim{x} is quasi-complete and} \\
\Veim{x} \in \var{mfc} \implies
\Veim{x} \in \var{mslo}
\end{gathered}
\end{equation}
By the definition of a maximal fleeting closure,
an EIM is in its own maximal fleeting closure,
so $\Veim{eim} \in \var{mfc}$.
By assumption for the theorem,
\Veim{eim} is quasi-complete and
$\Veim{eim} \in \var{mslo}$.
This gives us
\eqref{eq:maximal-fleeting-silo-in-maximal-silo-20}
for $\var{x} = \var{eim}$, which we take as the
basis of both inductions.

For the step of the forward induction,
we assume
\eqref{eq:maximal-fleeting-silo-in-maximal-silo-20}
for $\var{x} = \iop{null-scan-op}{\var{i}}{\var{eim}}$,
to show
\eqref{eq:maximal-fleeting-silo-in-maximal-silo-20}
for $\var{x} = \iop{null-scan-op}{(\Vincr{i})}{\var{eim}}$.
By assumption for the step, there is some \var{slix}
and some \var{fcix}
such that
\[
\Vel{mfc}{fcix} =
\Vel{mslo}{slix} = \iop{null-scan-op}{\var{i}}{\var{eim}}.
\]
If
\[
\iop{null-scan-op}{(\Vincr{i})}{\var{eim}} = \undefined,
\]
we have
\eqref{eq:maximal-fleeting-silo-in-maximal-silo-20}
for $\var{x} = \iop{null-scan-op}{(\Vincr{i})}{\var{eim}}$,
vacuously.
Otherwise, by assumption for the step,
\Vel{mfc}{fcix} is quasi-complete,
so that
by \eqref{eq:maximal-fleeting-silo-in-maximal-silo-10},
\[
  \Vel{mslo}{slix} = \iop{null-scan-op}{\var{i}}{\var{eim}}
\]
has a silo effect.
Therefore, by the definition of a maximal silo,
\Vel{mslo}{slix} cannot be the top of the maximal silo,
and \Vel{mslo}{\Vincr{slix}} must have a defined value.
The effect of
\iop{null-scan-op}{\var{i}}{\var{eim}} is unique,
so that
\begin{equation}
\label{eq:maximal-fleeting-silo-in-maximal-silo-30}
\Vel{mfc}{\Vincr{fcix}} =
\Vel{mslo}{\Vincr{slix}} = \iop{null-scan-op}{(\Vincr{i})}{\var{eim}}.
\end{equation}
And,
from
\eqref{eq:maximal-fleeting-silo-in-maximal-silo-5},
we know that
\iop{null-scan-op}{(\Vincr{i})}{\var{eim}}
is quasi-complete.
This shows the step for the forward induction,
and the forward induction.

It remains to show the step of the reverse induction.
The reasoning is very similar to that for the step of
the forward induction.
We assume
\eqref{eq:maximal-fleeting-silo-in-maximal-silo-20}
for $\var{x} = \iop{null-scan-op}{\var{i}}{\var{eim}}$,
to show
\eqref{eq:maximal-fleeting-silo-in-maximal-silo-20}
for $\var{x} = \iop{null-scan-op}{(\Vdecr{i})}{\var{eim}}$.
Again, by assumption for the step,
there is some \var{slix}
and some \var{fcix}
such that
\[
\Vel{mfc}{fcix} =
\Vel{mslo}{slix} = \iop{null-scan-op}{\var{i}}{\var{eim}}.
\]
If
\[
\iop{null-scan-op}{(\Vdecr{i})}{\var{eim}} = \undefined,
\]
we have
\eqref{eq:maximal-fleeting-silo-in-maximal-silo-20}
for $\var{x} = \iop{null-scan-op}{(\Vdecr{i})}{\var{eim}}$,
vacuously.
Otherwise,
\Vel{mfc}{fcix} is quasi-complete by assumption for the step,
and it follows from that and
\eqref{eq:maximal-fleeting-silo-in-maximal-silo-12} that
\Vel{mslo}{slix} has a silo cause.
Since it has a silo cause,
\Vel{mslo}{slix} cannot be the bottom of a maximal silo.
The value of
$\el{mfc}{\Vdecr{fcix}} = \iop{null-scan-op}{(\Vdecr{i})}{\var{eim}}$,
is unique and is a silo cause,
and
\el{mslo}{\Vdecr{slix}} must be the silo cause
of
\Vel{mslo}{slix},
so that
\begin{equation}
\notag
\el{mslo}{\Vdecr{slix}} =
\el{mfc}{\Vdecr{fcix}} = \iop{null-scan-op}{(\Vdecr{i})}{\var{eim}}.
\end{equation}
For the step of the reverse induction,
we also need to show that
\begin{equation}
\label{eq:maximal-fleeting-silo-in-maximal-silo-50}
\text{\iop{null-scan-op}{(\Vdecr{i})}{\var{eim}} is quasi-complete.}
\end{equation}
\eqref{eq:maximal-fleeting-silo-in-maximal-silo-50}
follows from
\eqref{eq:maximal-fleeting-silo-in-maximal-silo-5}
and the assumption for the step.
With this we have the step of the reverse induction.
\end{proof}

\chapter{Leo memos}
\label{ch:leo}

\section{The history of a conjecture}

Jay Earley~\cite[p. 60]{Earley1968}%
\index{recce-general}{Earley, Jay}
conjectured that \Earley{} could be
modified to be \On{} for
all deterministic context-free grammars (DCFG's).
(The DCFG's are the union of the
\LRk{} grammars for all \var{k}.)
He gave no details of the method he had in mind.
Earley left the field shortly thereafter ---
by 1973 he had earned a second Ph.D. and
was a practicing psychotherapist in California.

In the late 1980's, Joop Leo%
\index{recce-general}{Leo, Joop}
also conjectured that
Earley's algorithm could be modified to be linear for all
DCFG's.
Leo was initially unaware of Earley's earlier conjecture ---
he discovered it in the course of writing up his
discovery.
Leo published his method in~\cite{Leo1991}.

The problem both investigators noticed was that,
while \Earley{} is \On{}
for left recursion,
and in fact very efficient,
it is $\order{\var{n}^2}$ for right recursion.
This is because all the EIM's necessary for a right
recursion are created at every parse location
where the right recursion might end.

For simplicity,
in the discussion of this section,
we will assume that the grammar is unambiguous,
or at least that it is not ambiguous in a way that affects
the right recursion we are discussing.
We will call each potential end location of a right recursion,
an \dfn{EORR},
and we will call
the EIM's needed to represent the right recursion
at an EORR, an \dfn{EORR set}.

In \Earley,
if the length of the right
recursion at an EORR is \var{n}, then the EORR set contains \var{n} EIM's.
The total number of EIM's in the EORR sets
needed for a right recursion of length \var{n} is
\[
  \sum_{\var{i} = 1}^\var{n} \var{i} = \order{\var{n}^2}.
\]
Of these EIM's, only \var{n} will actually be needed ---
the rest are useless.

Leo's idea was to memoize the right recursions.
With Leo memoization, each EORR set is represented by
a pair of EIM's and a memo.
There are \Oc{} Leo memos per Earley set,
so the time and space complexity
of an EORR set is \Oc{}.
The time and space complexity of all the EORR
sets in
a right recursion of length \var{n} will
be
\[
  \sum_{\var{i} = 1}^\var{n} 1 = \On.
\]

If, at evaluation time,
it is desirable to expand the Leo memoizations,
only the EORR set actually used in the parse
needs to be expanded.
All of the EIM's actually used in a right recursion
will be in a single EORR set.
The number of memoized
EIM's that need to be expanded
will be \On{},
where \var{n} is the length of the recursion.
As a result,
even if the time and space
required to expand Leo memoization
during evaluation
are taken into account,
the time and space complexity of
a right recursion become
$\On{} = \On{} + \On{}$.

Joop Leo%
\index{recce-general}{Leo, Joop}
showed that,
with his modification, Earley's algorithm
is \On{} for all LR-regular grammars.
LR-regular is LR where lookahead
is infinite length, but restricted to
distinguishing between regular expressions.
Earley did not claim \On{} for LR-regular
because LR-regular was not introduced
to the literature until 1973~\cite{Culik1973}.
Even in 1991, LR-regular was not well-known,
which is why Leo only claims
the weaker \LRk{} bound in
his title.

Summarizing Leo's method,
it consists of spotting potential right recursions
and memoizing them.
Leo restricts the memoization to situations where
the right recursion is unambiguous.
Potential right recursions are memoized by
Earley set, using what Leo called
``transitive items''.
In this monograph, Leo's ``transitive items''
will be called Leo memos.

Implementation of Leo memoization
will be considered in full detail,
and its correctness proved,
in Chapter~\ref{ch:recce}.
In this chapter, we develop
a conceptual framework for Leo memoization.
We define, at an abstract level,
the data structures
that Leo memoization requires,
and we demonstrate their basic properties.

\section{Definition}

Leo memos have type \dtype{LEO}.
In each Earley set, there is at most one Leo memo per symbol.
A Leo memo is the 4-tuple
\begin{equation}
\label{eq:def-leo-memo-10}
\Vleo{leo} = [ \Vsym{transition}, \Vdr{top}, \Vorig{top}, \Vloc{memloc} ].
\end{equation}
For \Vleo{leo} as in
\eqref{eq:def-leo-memo-10},
we write
\begin{alignat*}{1}
\Symbol{\Vleo{leo}} & \; \text{to say \Vsym{transition}}, \\
\DR{\Vleo{leo}} & \; \text{to say \Vdr{top}}, \\
\Left{\Vleo{leo}} & \; \text{to say \Vorig{top}} \\
\text{and \Current{\Vleo{leo}}} & \; \text{to say \Vloc{memloc}.}
\end{alignat*}

Intuitively, \Vleo{leo},
the Leo memo of
\eqref{eq:def-leo-memo-10},
states an intent to memoize
some of the layers of certain silos occurring after
\Current{\Vleo{leo}}.
The elements
\Symbol{\Vleo{leo}},
\DR{\Vleo{leo}},
and \Left{\Vleo{leo}}
are
used to define which silo layers will be memoized
in a way that will be detailed later in this chapter.
\Vsym{transition}
in \eqref{eq:def-leo-memo-10}
is the
\dfn{Leo transition symbol}
or
\xdfn{transition symbol}{transition symbol!wrt a Leo memo}.
\DR{\Vleo{leo}} must be quasi-complete.

\Vleo{leo} is considered to be located at \Vloc{memloc},
and \Vloc{memloc} is called the
\xdfn{current location}{current location!wrt a Leo memo}
of \Vleo{leo}.
We will sometimes speak of \Vleo{leo} as being in the
Earley set at \Vloc{memloc},
although \Vleo{leo} is \textbf{not}
an Earley item,
and therefore, strictly speaking,
not in any Earley set.

\begin{definition}
\dtitle{Locsym of a Leo memo}
\label{def:leo-locsym}
The
\qdfn{locsym}%
\index{recce-definitions}{locsym@locsym!of a Leo memo}
of the Leo memo \Vleo{l}
is
\[
<\Symbol{\Vleo{l}}, \Current{\Vleo{l}}>.
\]
We also write the locsym of \Vleo{l} as \LSY{\Vleo{l}}.
\end{definition}

\section{Leo memo validity}

We now look at the conditions under which Leo memos become valid.
Recall that
we say that \Vdr{q} is a \dfn{quasi-penult}
if and only if it is
\begin{equation*}
\begin{split}
& \Vdr{q} = [ \Vsym{A} \de \Vstr{before} \mydot \Vsym{B} \cat \Vstr{after} ] \\
& \qquad \text{for some $[ \Vsym{A} \de \Vstr{before} \cat \Vsym{B} \cat \Vstr{after} ] \in \Crules$} \\
& \qquad \qquad \text{such that $\Vstr{after} \derives \epsilon$ and $\Vsym{B} \nderives \epsilon$}.
\end{split}
\end{equation*}

\begin{definition}
\dtitle{Postdot-unique}
\label{def:postdot-unique}
An EIM is \dfn{postdot-unique} if its postdot locsym
is unique.
That is,
\Veim{uniq} is \dfn{postdot-unique}
if and only if
for all \Veim{eim} in the parse,
\begin{multline}
\label{eq:def-postdot-unique-10}
\Postdot{\var{eim}} = \Postdot{\var{uniq}} \\
\implies  (\var{eim} = \var{uniq}
\; \vee \;
 \Current{\var{eim}} \neq \Current{\var{uniq}}).
\end{multline}
\end{definition}

\begin{definition}
\dtitle{Leo-eligible}
\label{def:leo-eligible}
A rule is
\xdfn{Leo-eligible}{Leo-eligible (rule)}
if and only if it is right-recursive.
A dotted rule is
\xdfn{Leo-eligible}{Leo-eligible (dotted rule)}
if and only if
its rule is Leo-eligible,
and it is a quasi-penult.
An EIM is
\xdfn{Leo-eligible}{Leo-eligible (EIM)}
if and only if
its dotted rule is Leo-eligible,
and it is postdot-unique.
\end{definition}

In Leo's original algorithm,
and in early versions of the Marpa algorithm,
all rules were treated
as Leo-eligible,
not just those rules which are
right-recursive.
Experience with Marpa showed that,
while the costs of Leo memoization are
quite manageable,
they do exist,
so that it makes sense to
target Leo memoization carefully.
If all penults are memoized,
many memoizations will be performed where
the longest potential Leo sequence is short,
and the payoff from Leo memoization
is therefore very limited.
By restricting Leo memoization to right-recursive rules,
\Marpa{} incurs the cost of Leo memoization only in cases
where EORR sets can grow arbitrarily
large.

\begin{definition}
\label{def:basis-of-leo-memo}
\dtitle{Basis of a Leo memo}
Let \Vleo{eff} be a Leo memo.
We say that \Veim{basis} is
a \xdfn{basis}{basis (EIM)!wrt a Leo memo}
of \Vleo{eff} if and only if
both of the following conditions are true:
\begin{itemize}
\item
\Veim{basis} is Leo-eligible.
\item
$\LSY{\Vleo{eff}} = \PLSY{\Veim{basis}}$.
\end{itemize}
When \Veim{basis} is the basis of \Vleo{eff},
we say that \Veim{basis} is a
\xdfn{bottom-up cause}{bottom-up cause (of a Leo memo)}
of \Vleo{eff}
and that \Vleo{eff} is the
\xdfn{effect}{effect!LEO as the effect of an EIM and
   optionally, another LEO}
of \Veim{basis}.
\end{definition}

\begin{theorem}
\ttitle{Leo basis uniqueness by postdot locsym}
\label{leo-basis-uniqueness-by-postdot-locsym}
For every postdot locsym, there is at most one Leo basis.
\end{theorem}

\begin{proof}
Let \Veim{bas1} be the basis of \Vleo{l1},
and
let \Veim{bas2} be the basis of \Vleo{l2}.
For the purpose of this proof, we make no assumption
about whether or not \Vleo{l1} and \Vleo{l2}
are distinct.

Assume for a reductio that
\begin{equation}
\label{leo-basis-uniqueness-by-postdot-locsym-10}
\tag{RAA}
\begin{gathered}
\Veim{bas1} \neq \Veim{bas2} \; \text{and}
\\
\text{\Veim{bas1} and \Veim{bas2} have the same postdot locsym.}
\end{gathered}
\end{equation}
We know that \Veim{bas1} is Leo-eligible
\dref[basis of a Leo memo]{def:basis-of-leo-memo}.
Therefore \Veim{bas1} is postdot-unique
\dref[Leo eligibility of an EIM]{def:leo-eligible}.
Therefore \Veim{bas1} and \Veim{bas2}
cannot have the same postdot locsym
\dref[postdot unique]{def:postdot-unique}.
This contradicts
\eqref{leo-basis-uniqueness-by-postdot-locsym-10}
and shows the reductio and the theorem.
\end{proof}

\begin{lemma}
\ltitle{Leo basis locsym uniqueness}
\label{lem:leo-basis-locsym-uniqueness}
Let
\Vleo{l1}, \Vleo{l2}
be two Leo memos
with the same locsym,
that is
\begin{equation}
\label{eq:leo-basis-locsym-uniqueness-10}
\LSY{\Vleo{l1}} = \LSY{\Vleo{l2}}
\end{equation}
Let \Veim{b1} be the EIM basis of \Vleo{l1} and
let \Veim{b2} be the EIM basis of \Vleo{l2}.
Then $\Veim{b1} = \Veim{b2}$.
\end{lemma}

\begin{proof}
Assume, for a reductio,
that
\eqref{eq:leo-basis-locsym-uniqueness-10}
holds, and
that $\Veim{b1} \neq \Veim{b2}$.
By the definition of the basis of a Leo memo,
\begin{equation}
\label{eq:leo-basis-locsym-uniqueness-16}
\begin{gathered}
\PLSY{\Veim{b1}} = \LSY{\Vleo{l1}}
\\
\PLSY{\Veim{b2}} = \LSY{\Vleo{l2}}
\end{gathered}
\end{equation}
so that,
\begin{align}
\label{eq:leo-basis-locsym-uniqueness-22}
& \PLSY{\Veim{b1}} = \PLSY{\Veim{b2}}
\becuz
\eqref{eq:leo-basis-locsym-uniqueness-10},
\eqref{eq:leo-basis-locsym-uniqueness-16}.
\\
\label{eq:leo-basis-locsym-uniqueness-24}
& \Veim{b1} \neq \Veim{b2} \becuz
\text{ASM for reductio}.
\\
\label{eq:leo-basis-locsym-uniqueness-26}
& \myparbox{%
\Veim{b1} is not postdot-unique
\becuz{}
\eqref{eq:leo-basis-locsym-uniqueness-22},
\eqref{eq:leo-basis-locsym-uniqueness-24}.
} \\
\label{eq:leo-basis-locsym-uniqueness-28}
& \myparbox{%
\Veim{b1} is not Leo-eligible
\becuz{}
\eqref{eq:leo-basis-locsym-uniqueness-26},
\dref[Leo eligibility of an EIM]{def:leo-eligible}.
} \\
\label{eq:leo-basis-locsym-uniqueness-30}
& \myparbox{%
\Veim{b1} is not the basis of a Leo memo
\becuz{}
\eqref{eq:leo-basis-locsym-uniqueness-28},
\dref[basis of a Leo memo]{def:basis-of-leo-memo}.
} \\
\label{eq:leo-basis-locsym-uniqueness-32}
& \myparbox{%
\Veim{b1} is the basis of \Vleo{l1}
\becuz{}
ASM for the theorem.
}
\end{align}
The contradiction between
\eqref{eq:leo-basis-locsym-uniqueness-30}
and 
\eqref{eq:leo-basis-locsym-uniqueness-32}
shows the reductio and the theorem.
\end{proof}

\begin{definition}
\label{def:down-cause-of-leo-memo}
\dtitle{Top-down cause of a Leo memo}
Let \Veim{basis} be an EIM, and let
\Vleo{eff} be a Leo memo,
where \Veim{basis} is the basis of \Vleo{eff}.
Let \Vleo{down} be a Leo memo.
If and only if
\begin{equation*}
  \LSY{\Vleo{down}} = \LSY{\Veim{basis}},
\end{equation*}
we say that
\Vleo{down} is a
\xdfn{top-down cause}{top-down cause!LEO top-down cause of a 2nd Leo memo}%
\index{recce-definitions}{matching!LEO, of an incomplete EIM}
of \Vleo{eff}.

If and only if \Vleo{down} is a top-down cause of \Vleo{eff},
we also say the following:
\begin{itemize}
\item
\Vleo{eff} is the
\xdfn{effect}{effect!LEO, as the effect of another LEO}
of \Vleo{down}.
\item
\Veim{basis} is a
\xdfn{bottom-up cause}{bottom-up cause!EIM bottom-up cause of a LEO}%
\index{recce-definitions}{matching!incomplete EIM, of a LEO}
of \Vleo{eff}.
\item
\Vleo{down} and \Veim{basis} \qdfn{match}%
\index{recce-definitions}{match!between a LEO and an incomplete EIM}.
\end{itemize}
\end{definition}

In this monograph,
we will sometimes also call a valid Leo memo an
\xdfn{instantiated}{instantiated (Leo memo)}
Leo memo.

\begin{definition}
\label{def:validity-of-leo-memo}
\dtitle{Validity of a Leo memo}
Let \Vleo{eff} be a Leo memo.
\Vleo{eff} is
\xdfn{valid}{valid (Leo memo)}
if and only if the following hold:

\begin{itemize}
\item
There is a valid EIM,
call it \Veim{basis},
which is the basis of \Vleo{eff}.
\item
One of the following two cases is true.
\end{itemize}

The two cases are
based on whether or not \Vleo{eff}
has a top-down cause.

\textbf{Case 1}:
In the first case,
\Vleo{eff} has
an instantiated top-down cause.
Let that top-down cause be \Vleo{down}.
This case holds if and only if
\begin{equation*}
\Vleo{eff} = \left[
  \begin{gathered}
  \Postdot{\Veim{basis}}, \DR{\Vleo{down}}, \\
  \Left{\Vleo{down}}, \Current{\Veim{basis}}
  \end{gathered}
\right].
\end{equation*}

\textbf{Case 2}:
In the second case,
there is no instantiated
top-down cause for \Vleo{eff}.
This case holds if and only if
\begin{equation*}
\Vleo{eff} = \left[
  \begin{gathered}
  \Postdot{\Veim{basis}},
  \Next{\DR{\Veim{basis}}}, \\
  \Left{\Veim{basis}}, \Current{\Veim{basis}}
  \end{gathered}
\right].
\end{equation*}
\vspace{.5ex} % extra space needed before end marker
\end{definition}

\begin{theorem}
\ttitle{Leo basis uniqueness by memo}
\label{t:leo-basis-uniqueness}
A valid Leo memo has exactly one valid basis.
\end{theorem}

\begin{proof}
A valid Leo memo must have at least one basis
\becuz{} \dref[validity of Leo memo]{def:validity-of-leo-memo}.
For the theorem,
it remains to show that a Leo memo cannot have more than
one basis.

Assume for a reductio that \Vleo{l} is a Leo memo
with two distinct basis EIM's, call them \Veim{bas1}
and \Veim{bas2}:
\begin{equation}
\tag{RAA}
\label{eq:leo-basis-uniqueness-5}
\Veim{bas1} \neq \Veim{bas2}.
\end{equation}
From \dref[basis of a Leo memo]{def:basis-of-leo-memo},
we know that
\begin{equation}
\label{eq:leo-basis-uniqueness-10}
\PLSY{\Veim{bas1}} = \LSY{\Vleo{l}} = \PLSY{\Veim{bas2}}.
\end{equation}
Because \Veim{bas1} is the basis of \Vleo{l},
\Veim{bas1} is Leo-eligible
\dref[basis of a Leo memo]{def:basis-of-leo-memo}.
Because \Veim{bas1} is Leo-eligible,
it must be postdot-unique
\dref[Leo-eligible]{def:leo-eligible}.
But \Veim{bas1} is not postdot-unique
\becuz{}
\eqref{eq:leo-basis-uniqueness-10},
\dref[postdot-unique]{def:postdot-unique}.
Therefore \Veim{bas1} is not the basis of a Leo memo
\dref[basis of a Leo memo]{def:basis-of-leo-memo}.
This is contrary to the assumption for the reductio
\eqref{eq:leo-basis-uniqueness-5}.
Therefore \Vleo{l} has at most one basis,
which is what remained
to show for the theorem.
\end{proof}

\begin{theorem}
\ttitle{Leo transition symbol is non-terminal}
\label{t:leo-transition-symbol-non-terminal}
The transition symbol of a valid Leo memo
must be a non-terminal other than the accept symbol.
\end{theorem}

\begin{proof}
By the definition of validity for a Leo memo,
the rule of the basis must be of the form
\begin{equation}
\label{eq:leo-transition-symbol-non-terminal-10}
\Vrule{r} = [ \Vsym{A} \de \Vstr{prefix} \Vsym{trans} \Vstr{nul} ],
\end{equation}
where $\Vstr{nul} = \epsilon$,
and
where
\begin{gather}
\label{eq:leo-transition-symbol-non-terminal-20}
\text{\Vrule{r} is Leo-eligible,} \\
\label{eq:leo-transition-symbol-non-terminal-23}
\text{and \Vsym{trans} is the transition symbol of the Leo memo.}
\end{gather}
By
\eqref{eq:leo-transition-symbol-non-terminal-20},
\Vrule{r} is Leo-eligible,
and therefore \Vrule{r} must be right-recursive.
By the definition of right-recursive,
\Vrule{r} is right-recursive only if
\Vsym{trans} is right-recursive.
To be right-recursive, \Vsym{trans}
must be a non-terminal.
By \eqref{eq:leo-transition-symbol-non-terminal-23},
\Vsym{trans} is the transition symbol,
and therefore the transition symbol must be a
non-terminal.

It remains
to show that $\Vsym{trans} \neq \Vsym{accept}$.
By its definition, \Vsym{accept} occurs only in one place ---
on the LHS of the accept rule.
Using this fact and
\eqref{eq:leo-transition-symbol-non-terminal-10},
we see that
$\Vsym{trans} \neq \Vsym{accept}$.
\end{proof}

% TODO -- deal more carefully with
% instantiation
% in a later revision
%
% we will want to allow for implementations which
% selectively omit valid Leo memos.
% We therefore will distinquish between
% valid Leo memos
% and
% All instantiated Leo memos are valid.
% A valid Leo memo may or may not be instantiated,
% depending on the implementation.

\begin{definition}
\dtitle{Matching Leo memo of a parse instance}
\label{def:inst-matching-leo-memo}
A Leo memo, call it \Vleo{l},
and a parse instance, call it \Vinst{i},
are said to
\xdfn{match}{match!between a LEO and an INST}
if and only if
\begin{gather*}
\LSY{\Vleo{l}} = \LSY{\Vinst{i}}.
\end{gather*}
We say that \Vleo{l} is a
\xdfn{matching}{matching!LEO, of an INST}
Leo memo of \Vinst{i}
and that \Vinst{i} is a
\xdfn{matching}{matching!INST, of a LEO}
parse instance of \Vleo{l}.
We write $\Memo{\Vinst{i}} = \Vleo{l}$%
\index{recce-notation}{Memo@\myfnname{Memo}!\Vop{Memo}{\Vinst{i}} = \Vleo{l}}
to indicate that the Leo memo \Vleo{l} matches
the \Vinst{i}.
\end{definition}

\begin{definition}
\dtitle{Matching Leo memo of an EIM}
\label{def:eim-matching-leo-memo}
A Leo memo, call it \Vleo{l},
and a completed EIM, call it \Veim{e},
are said to
\xdfn{match}{match!between a LEO and a complete EIM}
if and only if
\[
\text{\Vleo{l} matches \SymEq{\Veim{e}}}.
\]
We say that \Vleo{l} is a
\xdfn{matching}{matching!LEO, of a complete EIM}
Leo memo of \Veim{e}
and that \Veim{e} is a
\xdfn{matching}{matching!complete EIM, of a LEO}
EIM of \Vleo{l}.
We write $\Memo{\Veim{e}} = \Vleo{l}$%
\index{recce-notation}{Memo@\myfnname{Memo}!\Vop{Memo}{\Veim{e}} = \Vleo{l}}
to indicate that the Leo memo \Vleo{l} matches
the \Veim{e}.
\end{definition}

\begin{definition}
\dtitle{Quasi-matching Leo memo}
\label{def:quasi-matching-leo-memo}
A Leo memo, call it \Vleo{l},
and a quasi-complete EIM, call it \Veim{q},
are said to
\xdfn{quasi-match}{quasi-match!between a LEO and an EIM}
if and only if
\Vleo{l} matches the completion EIM of \Veim{q}.
We say that \Vleo{l} is a
\xdfn{quasi-matching}{quasi-matching (LEO)!of an EIM}
Leo memo of \Veim{q}
and that \Veim{q} is a
\xdfn{quasi-matching}{quasi-matching (EIM)!of a LEO}
EIM of \Vleo{l}.
We write $\Memo{\Veim{q}} = \Vleo{l}$%
\index{recce-notation}{Memo@\myfnname{Memo}!\Vop{Memo}{\Veim{q}} = \Vleo{l}}
to indicate that the Leo memo \Vleo{l} quasi-matches
the \Veim{q}.
\end{definition}

\begin{theorem}
\ttitle{Matching Leo memo is quasi-matching}
\label{t:matching-leo-is-quasi-matching}
Let \Vleo{l} be a Leo memo which matches
an Earley item, call it \Veim{e}.
Then \Vleo{l} quasi-matches \Veim{e}.
\end{theorem}

\begin{proof}
TODO
Recall from
\dref[completion EIM of an EIM]{def:eim-dr-notions}
that the completion EIM of the quasi-complete EIM \Veim{q} is
\[
   \left[
   \begin{gathered}
     \big[ \Rule{\Veim{q}}, \Vdecr{\Vsize{\Rule{\Veim{q}}}} \big],
     \\
     \Left{\Veim{q}}, \Current{\Veim{q}}
   \end{gathered}
   \right].
\]
Note that, by
\dref{def:eim-matching-leo-memo}
and
\dref{def:quasi-matching-leo-memo},
if a Leo memo matches an EIM,
that Leo memo also quasi-matches that EIM.
\end{proof}

\begin{theorem}
\ttitle{Quasi-matching Leo memo of a completed EIM is matching}
\label{t:quasi-matching-completion-is-matching}
Let \Vleo{l} be a Leo memo which quasi-matches
a completed Earley item, call it \Veim{e}.
Then \Vleo{l} matches \Veim{e}.
\end{theorem}

\begin{proof}
TODO
\end{proof}

\begin{theorem}
\ttitle{Fleeting closure quasi-match}
\label{t:leo-memo-fleeting closure}
Let \Veim{e1} and \Veim{e2} be EIM's
in the same fleeting closure,
and let
\Vleo{l}
be a Leo memo quasi-matching \Veim{e1}.
Then \Vleo{l} quasi-matches \Veim{e2}.
\end{theorem}

\begin{proof}
Let \var{fc} be the fleeting closure that contains
\Veim{e1} and \Veim{e2}.  Then
\begin{align}
\label{eq:leo-memo-fleeting closure-10}
& \myparbox{%
$\Veim{e1} \in \var{fc}$
\becuz{} WLOG, ASM for Th.
} \\
\label{eq:leo-memo-fleeting closure-12}
& \myparbox{%
$\Veim{e2} \in \var{fc}$
\becuz{} WLOG, ASM for Th.
} \\
\label{eq:leo-memo-fleeting closure-14}
& \myparbox{%
\Vleo{l} quasi-matches \Veim{e1}
\becuz{} ASM for Th.
} \\
\label{eq:leo-memo-fleeting closure-16}
& \myparbox{%
\Veim{e1} is quasi-complete
\becuz{} 
\eqref{eq:leo-memo-fleeting closure-14},
\dref[quasi-matching EIM]{def:quasi-matching-leo-memo}.
} \\
\label{eq:leo-memo-fleeting closure-18}
& \myparbox{%
\Veim{e2} is quasi-complete
\becuz{} 
\eqref{eq:leo-memo-fleeting closure-10},
\eqref{eq:leo-memo-fleeting closure-12},
\eqref{eq:leo-memo-fleeting closure-16},
\tref{t:fleeting-closure-shares-quasi-completeness}.
} \\
\label{eq:leo-memo-fleeting closure-20}
& \myparbox{%
\Veim{e1} and \Veim{e2} share the same
EIM completion, call it \Veim{comp}
\becuz{} 
\eqref{eq:leo-memo-fleeting closure-10},
\eqref{eq:leo-memo-fleeting closure-12},
\eqref{eq:leo-memo-fleeting closure-16},
\eqref{eq:leo-memo-fleeting closure-18},
\tref{t:fc-shares-eim-completion}.
} \\
\label{eq:leo-memo-fleeting closure-22}
& \myparbox{%
\Vleo{l} matches \Veim{comp}
\becuz{}
\eqref{eq:leo-memo-fleeting closure-14},
\dref[quasi-matching EIM]{def:quasi-matching-leo-memo}.
} \\
\label{eq:leo-memo-fleeting closure-24}
& \myparbox{%
\Vleo{l} quasi-matches \Veim{e2}
\becuz{}
\eqref{eq:leo-memo-fleeting closure-20},
\eqref{eq:leo-memo-fleeting closure-22},
\dref{def:quasi-matching-leo-memo}.
\qedhere
}
\end{align}
\end{proof}

\begin{theorem}
\ttitle{Basis/top-down equivalence}
\label{t:basis-top-down-equivalence}
Let \Vinst{up} be a valid parse instance,
and let \Vleo{l} be an
instantiated Leo memo
that matches \Vinst{up}.
Let \Veim{down} be a valid EIM.
Then \Veim{down} matches \Vinst{up}
if and only if
\Veim{down} is a basis of \Vleo{l}.
\end{theorem}

\begin{proof}
By assumption for the theorem \Vleo{l} matches
\Vinst{up}, so that
\begin{align}
\label{eq:basis-top-down-equivalence-10}
& \myparbox{%
$\LSY{\Vleo{l}} = \LSY{\Vinst{up}}$
\becuz{}
\dref[matching Leo memo of a parse instance]{def:inst-matching-leo-memo},
ASM for this theorem.
}
\intertext{%
\textbf{``If'' direction}:
}
\label{eq:basis-top-down-equivalence-12}
& \myparbox{%
\Veim{down} is a basis of \Vleo{l}
\becuz{}
ASM for the ``if'' direction.
} \\
\label{eq:basis-top-down-equivalence-14}
& \myparbox{%
$\PLSY{\Veim{down}} = \LSY{\Vleo{l}}$
\becuz{}
\eqref{eq:basis-top-down-equivalence-12},
\dref[basis of a Leo memo]{def:basis-of-leo-memo}.
} \\
\label{eq:basis-top-down-equivalence-16}
& \myparbox{%
$\PLSY{\Veim{down}} = \LSY{\Vinst{up}}$
\becuz
\eqref{eq:basis-top-down-equivalence-10},
\eqref{eq:basis-top-down-equivalence-14}.
} \\
\label{eq:basis-top-down-equivalence-18}
& \myparbox{%
\Veim{down} matches \Vinst{up}
\becuz{}
\eqref{eq:basis-top-down-equivalence-16},
\dref[matching causes]{def:matching-causes},
}
\intertext{%
where
\eqref{eq:basis-top-down-equivalence-18}
is what we needed to show the ``if'' direction.
}
\intertext{%
\textbf{``Only if'' direction}:
}
\label{eq:basis-top-down-equivalence-32}
& \myparbox{%
\Veim{down} matches \Vinst{up}
\becuz{}
ASM for the ``only if'' direction.
} \\
\label{eq:basis-top-down-equivalence-34}
& \myparbox{%
$\PLSY{\Veim{down}} = \LSY{\Vinst{up}}$
\becuz{}
\eqref{eq:basis-top-down-equivalence-32},
\dref[matching causes]{def:matching-causes},
} \\
\label{eq:basis-top-down-equivalence-36}
& \myparbox{%
$\PLSY{\Veim{down}} = \LSY{\Vleo{l}}$
\becuz
\eqref{eq:basis-top-down-equivalence-10},
\eqref{eq:basis-top-down-equivalence-34}.
} \\
\label{eq:basis-top-down-equivalence-38}
& \myparbox{%
\Veim{down} is a basis of \Vleo{l}
\becuz{}
\eqref{eq:basis-top-down-equivalence-36},
\dref[basis of a Leo memo]{def:basis-of-leo-memo}.
}
\end{align}
With
\eqref{eq:basis-top-down-equivalence-18}
and
\eqref{eq:basis-top-down-equivalence-38}
we have both directions and the theorem.
\end{proof}

\begin{theorem}
\ttitle{Properties of LEO-EIM matches}
\label{t:leo-match-props}
We make the following assumptions:
\begin{subequations}
\renewcommand{\theequation}{A\arabic{equation}}
\begin{align}
\label{eq:leo-match-props-asm-1}
& \myparbox{%
\Veim{e} is a valid EIM.
} \\
\label{eq:leo-match-props-asm-2}
& \myparbox{%
\Vleo{l} is an instantiated Leo memo.
} \\
\label{eq:leo-match-props-asm-3}
& \myparbox{%
\Vleo{l} matches \Veim{e}.
}
\end{align}
\end{subequations}

On those assumptions,
we have the following:
\begin{subequations}
\renewcommand{\theequation}{R\arabic{equation}}
\begin{align}
\label{eq:leo-match-props-req-1}
& \myparbox{%
\Vleo{l}
has exactly one valid basis,
call it \Veim{bas}.
} \\
\label{eq:leo-match-props-req-2}
& \myparbox{%
\Veim{bas} is the only matching top-down cause
of \Veim{e}.
} \\
\label{eq:leo-match-props-req-3}
& \myparbox{%
\Veim{e} is not the top-down cause of any effect.
} \\
\label{eq:leo-match-props-req-4}
& \myparbox{%
The cause-pair
$[ \Veim{bas}, \Veim{e} ]$
is the cause of exactly one valid effect,
call it \Veim{eff}.
} \\
\label{eq:leo-match-props-req-5}
& \myparbox{%
\Veim{e} is the cause of exactly one valid
effect, \Veim{eff}.
}
\end{align}
\end{subequations}
\end{theorem}

\begin{proof}
By assumption for the theorem,
\begin{align}
\label{eq:leo-match-props-5}
& \myparbox{%
\Vleo{l}
has exactly one valid basis,
call it \Veim{bas}
\becuz{}
\tref{t:leo-basis-uniqueness},
which is 
Requirement~\eqref{eq:leo-match-props-req-1}
of this theorem.
} \\
\label{eq:leo-match-props-8}
& \myparbox{%
\Veim{bas} is the only matching top-down cause of \Veim{e}
\becuz{}
\eqref{eq:leo-match-props-asm-1},
\eqref{eq:leo-match-props-asm-2},
\eqref{eq:leo-match-props-asm-3},
\eqref{eq:leo-match-props-5},
\tref{t:basis-top-down-equivalence},
which is Requirement
\eqref{eq:leo-match-props-req-2}
of this theorem.
} \\
\label{eq:leo-match-props-9}
& \myparbox{%
\Veim{e} is a completed EIM
\becuz{}
\eqref{eq:leo-match-props-asm-3},
\eqref{eq:leo-match-props-5},
\dref[matching EIM of a Leo memo]{def:eim-matching-leo-memo}.
} \\
\label{eq:leo-match-props-12}
& \myparbox{%
\Veim{e} is not the top-down cause of any effect
\becuz{}
\eqref{eq:leo-match-props-9},
\tref{t:completed-eim-as-a-cause},
which is Requirement
\eqref{eq:leo-match-props-req-3}
of this theorem.
} \\
\label{eq:leo-match-props-14}
& \myparbox{%
The cause-pair
$[ \Veim{bas}, \Veim{e} ]$
is the cause of exactly one valid effect,
call it \Veim{eff}
\becuz{}
\eqref{eq:leo-match-props-8},
\tref{t:effect-from-symbolic-cause-pair},
which is Requirement
\eqref{eq:leo-match-props-req-4}
of this theorem.
} \\
\label{eq:leo-match-props-16}
& \myparbox{%
\Veim{e} is the cause of exactly one valid
effect, \Veim{eff}
\becuz{}
\eqref{eq:leo-match-props-8},
\eqref{eq:leo-match-props-9},
\tref{t:completed-eim-as-a-cause},
\eqref{eq:leo-match-props-14},
which is Requirement
\eqref{eq:leo-match-props-req-5}
of this theorem. \qedhere
}
\end{align}
\end{proof}

\chapter{Leo catenas}

\begin{definition}
\dtitle{Leo catena}
\label{def:leo-catena}
A
\dfn{Leo catena},
also called simply a
\dfn{catena},
is a sequence of Leo memos,
where each element of the sequence
is the top-down cause of the previous element.
A catena is
\xdfn{maximal}{maximal!catena}
if and only if its last element has no top-down cause.
Where \Vleo{l} is a Leo memo,
we say that the
\xdfn{catena}{catena!wrt a Leo memo}
of \Vleo{l} is the maximal catena whose first element
is \Vleo{l}.
\end{definition}

\begin{lemma}
\ltitle{Leo catena non-increasing location}
\label{lem:leo-catena-non-increasing-location}
The current location of the Leo memos in a Leo catena
is non-increasing.
\end{lemma}

\begin{proof}
Let \var{cat} be a catena.
For all \var{a},
where \Veim{bas} is the basis of \Vel{cat}{a},
\begin{align}
\label{eq:lem-leo-catena-non-increasing-location-5}
& \myparbox{\el{cat}{\Vincr{a}}
is the top-down cause of
\Vel{cat}{a}
\becuz{}
\dref[catena]{def:leo-catena};
}
\\
\label{eq:lem-leo-catena-non-increasing-location-10}
& \myparbox{
$\Current{\Vel{cat}{a}} = \Current{\Veim{bas}}$
\becuz{} \dref[basis of a Leo memo]{def:basis-of-leo-memo}; and
}
\\
\label{eq:lem-leo-catena-non-increasing-location-15}
&
\myparbox{
$\Current{\el{cat}{\Vincr{a}}} = \Left{\Veim{bas}}$
\becuz{} \dref[top-down cause of a Leo memo]{def:down-cause-of-leo-memo}.
}
\intertext{The current location of every EIM is at or after
its origin, so that}
\label{eq:lem-leo-catena-non-increasing-location-20}
& \forall \; \Veim{x} : \Left{\Veim{x}} \le \Current{\Veim{x}}
\; \text{and}
\\
\label{eq:lem-leo-catena-non-increasing-location-22}
& \myparbox{
$\Current{\Vel{cat}{a}} \ge \Current{\el{cat}{\Vincr{a}}}$
\becuz{} \eqref{eq:lem-leo-catena-non-increasing-location-10},
\eqref{eq:lem-leo-catena-non-increasing-location-15},
\eqref{eq:lem-leo-catena-non-increasing-location-20}.
}
\end{align}
The lemma follows from
\eqref{eq:lem-leo-catena-non-increasing-location-22}.
\end{proof}

\begin{lemma}
\ltitle{Leo catena cycle}
\label{lem:leo-catena-cycle}
In a Leo catena,
no two distinct elements
share the same locsym.
\end{lemma}

\begin{proof}
Let \var{cat} be a catena.
Assume, for a reductio, that
\begin{equation}
\label{eq:lem-leo-catena-cycle-5}
\tag{RAA}
\exists \; \var{x}, \var{y} : 
\left(
\begin{gathered}
\var{x} \neq \var{y} \\
\land \; \Current{\Vel{cat}{x}} = \Current{\Vel{cat}{y}} \\
\land \; \Symbol{\Vel{cat}{x}} = \Symbol{\Vel{cat}{y}}
\end{gathered}
\right).
\end{equation}

The current location of the elements of a catena is non-increasing
\lemref{lem:leo-catena-non-increasing-location}.
Therefore all the elements of \var{cat} with the same current location
are in a consecutive subsequence of \var{cat}.
Without loss of generality,
we let the current location be \Vloc{curr},
and we let \var{a}, \var{b} be such that
\begin{equation}
\label{eq:lem-leo-catena-cycle-8}
\begin{multlined}
\forall \; \var{i} :
(\var{a} \le \var{i} \le \var{b}
\equiv \Current{\Vel{cat}{i}} = \Vloc{curr})
\end{multlined}
\end{equation}
Since the choice of \var{x}, \var{y} in 
\eqref{eq:lem-leo-catena-cycle-5}
is arbitrary, we assume without loss
of generality that
\begin{equation}
\label{eq:lem-leo-catena-cycle-8b}
\var{x} \neq \var{y} \implies \var{x} < \var{y}.
\end{equation}
Combining
\eqref{eq:lem-leo-catena-cycle-5},
\eqref{eq:lem-leo-catena-cycle-8}
and \eqref{eq:lem-leo-catena-cycle-8b},
we know that our reductio requires that
there is \var{x}, \var{y} such that
\begin{equation}
\label{eq:lem-leo-catena-cycle-8d}
\exists \; \var{x}, \var{y} : 
(\var{a} \le \var{x} < \var{y} \le \var{b}
\; \land \; \Symbol{\Vel{cat}{x}} = \Symbol{\Vel{cat}{y}}).
\end{equation}

If $\var{a} = \var{b}$, our assumption for the reductio
\eqref{eq:lem-leo-catena-cycle-5} is trivially false.
Therefore
$\var{a} < \var{b}$.
We now consider some \var{i} such that
\begin{align}
\label{eq:lem-leo-catena-cycle-8-1}
& \var{a} \le \var{i} < \var{b},
\intertext{where \var{i} is
otherwise arbitrary, so that}
\label{eq:lem-leo-catena-cycle-9}
& \myparbox{
\el{cat}{\Vincr{i}}
is the top-down cause
of
\Vel{cat}{i}
\becuz{} \dref[catena]{def:leo-catena};
}
\\
\label{eq:lem-leo-catena-cycle-9b}
& \var{a} \le \var{i} < \Vincr{i} \le \var{b}
\becuz \eqref{eq:lem-leo-catena-cycle-8-1};
\\
\label{eq:lem-leo-catena-cycle-10}
& \Current{\Vel{cat}{i}} = \Current{\el{cat}{\Vincr{i}}}
\becuz
\eqref{eq:lem-leo-catena-cycle-8},
\eqref{eq:lem-leo-catena-cycle-9b};
\\
\label{eq:lem-leo-catena-cycle-12}
& \myparbox{
\Vel{cat}{i} has a unique basis, call it \Veim{bas}
\becuz{} \tref{t:leo-basis-uniqueness};
}
\\
\label{eq:lem-leo-catena-cycle-14}
& \myparbox{$\Current{\el{cat}{\Vincr{i}}} = \Left{\Veim{bas}}$
\becuz{}
\eqref{eq:lem-leo-catena-cycle-9},
\eqref{eq:lem-leo-catena-cycle-12},
\dref[top-down cause of Leo memo]{def:down-cause-of-leo-memo};
}
\\
\label{eq:lem-leo-catena-cycle-16}
& \myparbox{$\Current{\Vel{cat}{i}} = \Current{\Veim{bas}}$
\becuz{}
\eqref{eq:lem-leo-catena-cycle-12},
\dref[basis of a Leo memo]{def:basis-of-leo-memo};
}
\\
\label{eq:lem-leo-catena-cycle-18}
& \myparbox{$\Current{\Veim{bas}} = \Left{\Veim{bas}}$
\becuz{}
\eqref{eq:lem-leo-catena-cycle-10},
\eqref{eq:lem-leo-catena-cycle-14},
and \eqref{eq:lem-leo-catena-cycle-16};
}
\\
\label{eq:lem-leo-catena-cycle-20}
& \myparbox{\Veim{bas} is a quasi-prediction
\becuz{}
\eqref{eq:lem-leo-catena-cycle-18};
}
\\
\label{eq:lem-leo-catena-cycle-22}
& \myparbox{\Veim{bas} is a quasi-penult
\becuz{}
\eqref{eq:lem-leo-catena-cycle-12},
\dref[basis of a Leo memo]{def:basis-of-leo-memo};
}
\\
\label{eq:lem-leo-catena-cycle-24}
& \myparbox{$\Symbol{\el{cat}{\Vincr{i}}} = \LHS{\Veim{bas}}$
\becuz{}
\eqref{eq:lem-leo-catena-cycle-9},
\eqref{eq:lem-leo-catena-cycle-12},
\dref[top-down cause of Leo memo]{def:down-cause-of-leo-memo};
}
\\
\label{eq:lem-leo-catena-cycle-26}
& \myparbox{$\Symbol{\Vel{cat}{i}} = \Postdot{\Veim{bas}}$
\becuz{}
\eqref{eq:lem-leo-catena-cycle-12},
\dref[basis of a Leo memo]{def:basis-of-leo-memo};
}
\\
\label{eq:lem-leo-catena-cycle-28}
& \begin{aligned}
& \Rule{\Veim{bas}} =
\left[
\begin{multlined}
\Symbol{\el{cat}{\Vincr{i}}}
\de
\\
\quad \Vstr{nul1}
\Cat
\Symbol{\Vel{cat}{i}}
\Cat
\Vstr{nul2}
\end{multlined}
\right]
\\
& \qquad \qquad \text{where $\Vstr{nul1} \destar \epsilon$
  and $\Vstr{nul2} \destar \epsilon$
}
\\
& \qquad \qquad \becuz
\text{
  \eqref{eq:lem-leo-catena-cycle-20},
  \eqref{eq:lem-leo-catena-cycle-22},
  \eqref{eq:lem-leo-catena-cycle-24},
  \eqref{eq:lem-leo-catena-cycle-26};
  and
}
\end{aligned}
\\
\label{eq:lem-leo-catena-cycle-30}
& \Symbol{\el{cat}{\Vincr{i}}} \xderives{1} \Symbol{\Vel{cat}{i}}
\becuz \eqref{eq:lem-leo-catena-cycle-28}.
\end{align}

By
\eqref{eq:lem-leo-catena-cycle-8-1} and
\eqref{eq:lem-leo-catena-cycle-30},
we have that,
for every \var{i} such that
$\var{a} \le \var{i} < \var{b}$,
\[
\Symbol{\el{cat}{\Vincr{i}}} \xderives{1} \Symbol{\Vel{cat}{i}}.
\]
From this, we see that
for every \var{i}, \var{j} such that
$\var{a} \le \var{i} < \var{j} \le \var{b}$,
\begin{equation}
\label{eq:lem-leo-catena-cycle-36}
\Symbol{\Vel{cat}{j}} \deplus \Symbol{\Vel{cat}{i}}.
\end{equation}
Instantiating 
\eqref{eq:lem-leo-catena-cycle-36} with \var{x} and \var{y}
from
\eqref{eq:lem-leo-catena-cycle-8d},
we have
\begin{equation}
\label{eq:lem-leo-catena-cycle-39}
\Symbol{\Vel{cat}{y}} \deplus \Symbol{\Vel{cat}{x}}.
\end{equation}
But from
\eqref{eq:lem-leo-catena-cycle-8d}
we also know that
\begin{gather*}
 \Symbol{\Vel{cat}{x}} = \Symbol{\Vel{cat}{y}},
\end{gather*}
so that
\eqref{eq:lem-leo-catena-cycle-39}
is a cycle.
Cycles are forbidden in Marpa grammars.
This is a contradiction, which shows the reductio,
and with it,
the lemma.
\end{proof}

\begin{theorem}
\ttitle{Leo catena elements share common dotted rule and origin}
\label{t:catena-top-elements-identical}
In a catena, the dotted rule and origin elements
of every element are the same.
That is,
if \var{cat} is a catena,
then for all \var{a}, \var{b}
such that $0 \le \var{a} \le \Vlastix{cat}$
and $0 \le \var{b} \le \Vlastix{cat}$,
\begin{equation*}
\DR{\Vel{cat}{a}} = \DR{\Vel{cat}{b}}
\; \land \;
\Left{\Vel{cat}{a}} = \Left{\Vel{cat}{b}}
\end{equation*}
\end{theorem}

\begin{proof}
We assume for a reductio that there is a catena,
call it \var{cat},
such that
\begin{equation}
\tag{RAA}
\label{eq:catena-top-elements-identical-10}
\exists \; \var{x} :
\left(
\begin{gathered}
\DR{\Vel{cat}{x}} \neq \DR{\el{cat}{0}} \\
\lor \; \Left{\Vel{cat}{x}} \neq \Left{\el{cat}{0}}
\end{gathered}
\right).
\end{equation}
Let \var{x1} be the first value which can instantiate
\var{x} in 
\eqref{eq:catena-top-elements-identical-10}.
Trivially, we see that $\var{x1} > 0$,
so that
$\el{cat}{\Vdecr{x1}} \neq \undefined$ and,
since
\begin{align}
\label{eq:catena-top-elements-identical-19}
& \myparbox{
\el{cat}{\Vdecr{x1}} is before the first
value that can instantiate \var{x}
in \eqref{eq:catena-top-elements-identical-10},
we have
}
\\
\label{eq:catena-top-elements-identical-20b}
& \DR{\el{cat}{\Vdecr{x1}}} = \DR{\el{cat}{0}}
\becuz \eqref{eq:catena-top-elements-identical-19};
\\
\label{eq:catena-top-elements-identical-20d}
& \Left{\el{cat}{\Vdecr{x1}}} = \Left{\el{cat}{0}}
\becuz \eqref{eq:catena-top-elements-identical-19};
\\
\label{eq:catena-top-elements-identical-22}
& \myparbox{
\Vel{cat}{x1}
is the top-down cause
of
\el{cat}{\Vdecr{x1}}
\becuz{} \dref[catena]{def:leo-catena};
}
\\
\label{eq:catena-top-elements-identical-24b}
&
\myparbox{
$\DR{\Vel{cat}{x1}} = \DR{\el{cat}{\Vdecr{x1}}}$
\becuz{}
\dref[validity of Leo memo with top-down cause]{def:validity-of-leo-memo};
}
\\
\label{eq:catena-top-elements-identical-24d}
&
\myparbox{
$\Left{\Vel{cat}{x1}} = \Left{\el{cat}{\Vdecr{x1}}}$
\becuz{}
\dref[validity of Leo memo with top-down cause]{def:validity-of-leo-memo};
}
\\
\label{eq:catena-top-elements-identical-26b}
&
\DR{\Vel{cat}{x1}} = \DR{\el{cat}{0}}
\becuz \eqref{eq:catena-top-elements-identical-20b},
\eqref{eq:catena-top-elements-identical-24b};
\; \text{and}
\\
\label{eq:catena-top-elements-identical-26d}
& \Left{\Vel{cat}{x1}} = \Left{\el{cat}{0}}
\becuz \eqref{eq:catena-top-elements-identical-20d},
\eqref{eq:catena-top-elements-identical-24d}.
\end{align}
\eqref{eq:catena-top-elements-identical-26b}
and
\eqref{eq:catena-top-elements-identical-26d}
show that \var{x1} cannot instantiate \var{x} in
\eqref{eq:catena-top-elements-identical-10}.
Since we defined \var{x1} as the first value which
can instantiate \var{x} in
\eqref{eq:catena-top-elements-identical-10},
that means there is no value that
can instantiate \var{x} in
\eqref{eq:catena-top-elements-identical-10},
and therefore that
\eqref{eq:catena-top-elements-identical-10}
is false.
This shows the reductio and the theorem.
\end{proof}

\begin{theorem}
\ttitle{Catena element uniqueness}
\label{catena-element-uniqueness}
Every element of a catena is distinct.
\end{theorem}

\begin{proof}
This theorem follows from Lemma
\ref{lem:leo-catena-cycle}.
\end{proof}

\begin{theorem}
\ttitle{Leo catenas are finite}
\label{t:leo-catenas-are-finite}
Every Leo catena has a finite length.
\end{theorem}

\begin{proof}
Let \var{cat} be a catena,
and let $\Current{\el{cat}{0}} = \var{i}$.
No element of \var{cat} occurs twice
\tref{catena-element-uniqueness}.
Therefore, if the number of possible distinct
catena elements in \var{cat} is finite, 
the length of \var{cat} is finite.
It remains to show that the number of possible distinct
catena elements is finite.

By Lemma
\ref{lem:leo-catena-non-increasing-location},
the location of the elements of \var{cat} is non-increasing,
so that
\begin{equation}
\myparbox{
\label{eq:leo-catenas-are-finite-10}
elements of \var{cat}
have at most \Vincr{i} distinct locations.
}
\end{equation}
By Lemma
\ref{lem:leo-catena-cycle},
if any two catena elements
are distinct, but at a single location,
they cannot share the same transition symbol.
The number of symbols in a Marpa grammar is a fixed
constant that depends on the grammar.
Let the number of symbols in \Cg{} be \var{sym-cnt}.
From this and
\eqref{eq:leo-catenas-are-finite-10},
we see that there are at most
$(\Vincr{i}) \times \var{sym-cnt}$ distinct elements in \var{cat}.
This number is finite, and therefore the length of \var{cat} is finite.
\end{proof}

\begin{theorem}
\ttitle{Leo top-down uniqueness}
\label{t:leo-down-uniqueness}
Every valid Leo memo has at most one top-down cause.
\end{theorem}

\begin{proof}
Let
\begin{equation}
\label{eq:leo-down-uniqueness-10}
\Vleo{eff} = [ \Vsym{sym}, \Vdr{dr}, \Vloc{orig}, \Vloc{curr} ]
\end{equation}
be a Leo memo.
Assume, for a reductio,
that \Vleo{eff} has two distinct top-down causes.
Let these be
\begin{gather}
\label{eq:leo-down-uniqueness-13}
\Vleo{cuz1} = [ \Vsym{sym1}, \Vdr{dr1}, \Vloc{orig1}, \Vloc{curr1} ] \quad \text{and} \\
\label{eq:leo-down-uniqueness-16}
\Vleo{cuz2} = [ \Vsym{sym2}, \Vdr{dr2}, \Vloc{orig2}, \Vloc{curr2} ].
\end{gather}
\Vleo{cuz1} and \Vleo{cuz2} are, by assumption for
the reductio,
top-down causes of \Vleo{eff}.
Applying 
the definition of validity for a Leo memo with a top-down cause
\dref[validity of a Leo memo]{def:validity-of-leo-memo}
to \Vleo{eff},
and
using
\eqref{eq:leo-down-uniqueness-10},
\eqref{eq:leo-down-uniqueness-13}
and
\eqref{eq:leo-down-uniqueness-16},
we see that
\begin{gather*}
\Vdr{dr} = \Vdr{dr1} \; \land \; \Vdr{dr} = \Vdr{dr2} \quad \text{and} \\
\Vloc{orig} = \Vloc{orig1} \; \land \; \Vloc{orig} = \Vloc{orig2}
\end{gather*}
and therefore
\begin{equation}
\label{eq:leo-down-uniqueness-20}
\Vdr{dr1} = \Vdr{dr2} \; \land \; \Vloc{orig1} = \Vloc{orig2}.
\end{equation}
From Theorem
\ref{t:leo-basis-uniqueness},
we know that \Vleo{eff} has a unique basis,
call it \Veim{bas}.
By \dref[Leo top-down cause]{def:down-cause-of-leo-memo},
we know that
\begin{gather*}
\LHS{\Veim{bas}} = \Vsym{sym1} \; \land \; \LHS{\Veim{bas}} = \Vsym{sym2} \quad \text{and} \\
\Left{\Veim{bas}} = \Vloc{curr1} \; \land \; \Left{\Veim{bas}} = \Vloc{curr2},
\end{gather*}
so that
\begin{equation}
\label{eq:leo-down-uniqueness-25}
\Vsym{sym1} = \Vsym{sym2} \; \land \; \Vloc{curr1} = \Vloc{curr2}.
\end{equation}
From
\eqref{eq:leo-down-uniqueness-13},
\eqref{eq:leo-down-uniqueness-16},
\eqref{eq:leo-down-uniqueness-20}
and
\eqref{eq:leo-down-uniqueness-25},
we have
\[
\Vleo{cuz1} = \Vleo{cuz2}.
\]
But we assumed for the reductio that \Vleo{cuz1}
and \Vleo{cuz2} are distinct.
So this gives us the reductio and the theorem.
\end{proof}

\begin{theorem}
\ttitle{Memo catena uniqueness}
\label{t:memo-catena-uniqueness}
The catena of a Leo memo is unique.
\end{theorem}

\begin{proof}
Let \Vleo{l} be a Leo memo.
Assume for a reductio that \Vleo{l}
has two distinct catenas,
\var{cat1} and \var{cat2},
so that
\begin{equation}
\label{t:memo-catena-uniqueness-5}
\el{cat1}{0} = \Vleo{l} = \el{cat2}{0}.
\end{equation}
Since \var{cat1} and \var{cat2} differ,
we know that
\[
\exists \; \var{ix} : \Vel{cat1}{ix} \neq \Vel{cat2}{ix}.
\]
Recall our convention that $\Vel{seq}{i} = \undefined$
if $\var{i} > \Vlastix{seq}$.

Let \var{ix1} be the first index
in which \var{cat1} and \var{cat2} differ.
We know from 
\eqref{t:memo-catena-uniqueness-5}
that $\var{ix1} > 0$, and therefore we have
\begin{gather}
\label{t:memo-catena-uniqueness-20}
\el{cat1}{\Vdecr{ix1}} = \el{cat2}{\Vdecr{ix1}} \; \text{and}
\\
\label{t:memo-catena-uniqueness-23}
\Vel{cat1}{ix1} \neq \Vel{cat2}{ix1}.
\end{gather}

By \tref{t:leo-down-uniqueness},
we know that every catena element has
at most one top-down cause.
Let
\begin{gather}
\label{t:memo-catena-uniqueness-25a}
\text{\Vleo{down1} be the top-down cause of
\el{cat1}{\Vdecr{ix1}} and}
\\
\label{t:memo-catena-uniqueness-25b}
\text{\Vleo{down2} be the top-down cause of
\el{cat2}{\Vdecr{ix1}}.}
\end{gather}
Recall our convention that $\Vleo{down1} = \undefined$ if 
\el{cat1}{\Vdecr{ix1}}
has no top-down cause and
$\Vleo{down2} = \undefined$ if 
\el{cat2}{\Vdecr{ix1}}
has no top-down cause.
By the definition of a catena,
\begin{equation}
\label{t:memo-catena-uniqueness-28}
\Vel{cat1}{ix1} = \Vleo{down1} \land \Vel{cat2}{ix1} = \Vleo{down2}.
\end{equation}
From
\eqref{t:memo-catena-uniqueness-20},
\eqref{t:memo-catena-uniqueness-25a},
\eqref{t:memo-catena-uniqueness-25b}
and \eqref{t:memo-catena-uniqueness-28},
we see that
\begin{equation}
\label{t:memo-catena-uniqueness-30}
\Vel{cat1}{ix1} = \Vel{cat2}{ix1},
\end{equation}
contrary to \eqref{t:memo-catena-uniqueness-23}.
This contradiction shows the reductio.
We conclude that \var{cat1} and \var{cat2}
are identical.
\end{proof}

\begin{theorem}
\ttitle{Leo memos are unique by locsym}
\label{t:leo-memo-uniqueness-by-locsym}
Let \Vsym{A} be a symbol in a grammar
and \Vloc{i} a location in a parse.
There is at most one instantiated Leo memo with
symbol \Vsym{A} at location \Vloc{i}.
That is,
for all
\Vleo{l1}, \Vleo{l2} :
\begin{gather*}
\neg \Instantiated{\Vleo{l1}} \lor \; \neg \Instantiated{\Vleo{l2}} \\
\lor \; \Current{\Vleo{l1}} \neq \Current{\Vleo{l2}} \\
\lor \; \Symbol{\Vleo{l1}} \neq \Symbol{\Vleo{l2}} \\
\lor \; \Vleo{l1} = \Vleo{l2}.
\end{gather*}
\end{theorem}

\begin{proof}
We assume, for a reductio, that there is
an instantiated Leo memo, call it \Vleo{l}, whose
locsym is identical to that of some
other instantiated Leo memo, call it \Vleo{l2},
where $\Vleo{l} \neq \Vleo{l2}$.
Every Leo memo is in a catena, even if it is only a
trivial catena of length 1.
So let \var{cat} be a catena that contains \Vleo{l2}.
Our assumption for the reductio can then be written as
\begin{equation}
\label{eq:leo-memo-uniqueness-by-postdot-locsym-10}
\tag{RAA}
\begin{gathered}
\exists \; \Vleo{l} \; \exists \; \var{ix} : \Instantiated{\Vleo{l}} \\
  \land \; \Symbol{\Vel{cat}{ix}} = \Symbol{\Vleo{l}} \\
  \land \; \Current{\Vel{cat}{ix}} = \Current{\Vleo{l}} \\
  \land \; \Vel{cat}{ix} \neq \Vleo{l}.
\end{gathered}
\end{equation}

A Leo catena is finite in length
\tref{t:leo-catenas-are-finite}.
Therefore, if any \var{ix} satisfies
\eqref{eq:leo-memo-uniqueness-by-postdot-locsym-10},
then there is a last \var{ix} that satisfies
\eqref{eq:leo-memo-uniqueness-by-postdot-locsym-10}.
Let the last \var{ix} that satisfies
\eqref{eq:leo-memo-uniqueness-by-postdot-locsym-10}
be \var{z}.

We note that,
by \eqref{eq:leo-memo-uniqueness-by-postdot-locsym-10}
and Lemma \ref{lem:leo-basis-locsym-uniqueness},
\Vel{cat}{z} and \Vleo{l} have the same basis.
Call this basis \Veim{bas}.

\Vel{cat}{z} has at most one top-down cause
\tref{t:leo-down-uniqueness}.
Call this top-down cause \Vleo{down}.
In keeping with our convention in this monograph,
$\Vleo{down} = \undefined$ if
the top-down cause
of \Vel{cat}{z} does not exist.

Since 
\Vel{cat}{z} and \Vleo{l} have the same basis,
every top-down cause of
\Vel{cat}{z}
is also a top-down cause of \Vleo{l}
\dref[Leo top-down cause]{def:down-cause-of-leo-memo}.
Therefore
\begin{equation}
\label{eq:leo-memo-uniqueness-by-postdot-locsym-12}
\text{\Vleo{down} is the top-down cause of both \Vel{cat}{z} and \Vleo{l}.}
\end{equation}
Note that $\Vleo{down} \neq \undefined$ if and only if
\Vleo{l} has a top-down cause.

Assume for an inner reductio that
\begin{equation}
\label{eq:leo-memo-uniqueness-by-postdot-locsym-13}
\tag{RAA1}
\var{z} = \Vlastix{cat}.
\end{equation}
Then \Vel{cat}{z} has no top-down cause
\dref[catena]{def:leo-catena}.
Therefore, using
\dref[validity of Leo memo with no top-down cause]{def:validity-of-leo-memo}
and \eqref{eq:leo-memo-uniqueness-by-postdot-locsym-10},
we have
\begin{equation}
\label{eq:leo-memo-uniqueness-by-postdot-locsym-16}
\Vel{cat}{z} = \left[
\begin{gathered}
  \Symbol{\Vleo{l}}, \Next{\DR{\Veim{bas}}}, \\
  \Left{\Veim{bas}}, \Current{\Vleo{l}}
\end{gathered}
\right].
\end{equation}
And since from
\eqref{eq:leo-memo-uniqueness-by-postdot-locsym-12}
we know that
\Vleo{l} also has no top-down cause, we have
\begin{equation}
\label{eq:leo-memo-uniqueness-by-postdot-locsym-19}
\begin{gathered}
\DR{\Vleo{l}} = \Next{\DR{\Veim{bas}}} \; \text{and} \\
\Left{\Vleo{l}} = \Left{\Veim{bas}}.
\end{gathered}
\end{equation}

From
\eqref{eq:leo-memo-uniqueness-by-postdot-locsym-16}
and \eqref{eq:leo-memo-uniqueness-by-postdot-locsym-19},
we know that
\[
  \Vleo{l} = \Vel{cat}{z}.
\]
This contradicts
\eqref{eq:leo-memo-uniqueness-by-postdot-locsym-10}
and shows the inner reductio.
From the inner reductio we conclude that
\begin{align}
\label{eq:leo-memo-uniqueness-by-postdot-locsym-22}
& 0 \le \var{z} < \Vlastix{cat}, \; \text{so that}
\\
\label{eq:leo-memo-uniqueness-by-postdot-locsym-23b}
& \text{\el{cat}{\Vincr{z}} exists
\becuz{} \eqref{eq:leo-memo-uniqueness-by-postdot-locsym-22}; and
}
\\
\label{eq:leo-memo-uniqueness-by-postdot-locsym-23d}
& \el{cat}{\Vincr{z}} = \Vleo{down} \neq \undefined
\becuz
\eqref{eq:leo-memo-uniqueness-by-postdot-locsym-23b},
\dref[catena]{def:leo-catena}.
\end{align}
Therefore, using
\dref[validity of Leo memo with top-down cause]{def:validity-of-leo-memo},
\eqref{eq:leo-memo-uniqueness-by-postdot-locsym-10},
and \eqref{eq:leo-memo-uniqueness-by-postdot-locsym-23d}
we have
\begin{equation}
\label{eq:leo-memo-uniqueness-by-postdot-locsym-25}
\Vel{cat}{z} = \left[
\begin{gathered}
  \Symbol{\Vleo{l}}, \DR{\Vleo{down}}, \\
  \Left{\Vleo{down}}, \Current{\Vleo{l}}
\end{gathered}
\right].
\end{equation}
And by
\eqref{eq:leo-memo-uniqueness-by-postdot-locsym-12}
and \dref[validity of Leo memo with top-down cause]{def:validity-of-leo-memo},
\begin{equation}
\label{eq:leo-memo-uniqueness-by-postdot-locsym-28}
\begin{gathered}
\DR{\Vleo{l}} = \DR{\Vleo{down}} \; \text{and} \\
\Left{\Vleo{l}} = \Left{\Vleo{down}}.
\end{gathered}
\end{equation}
From
\eqref{eq:leo-memo-uniqueness-by-postdot-locsym-25}
and \eqref{eq:leo-memo-uniqueness-by-postdot-locsym-28},
we again have that
\[
  \Vleo{l} = \Vel{cat}{z},
\]
which again
contradicts
\eqref{eq:leo-memo-uniqueness-by-postdot-locsym-10}
and again shows a reductio, this time the outer one.
With the outer reductio, we have the theorem.
\end{proof}

\begin{theorem}
\ttitle{Leo memo uniqueness by basis}
\label{t:leo-memo-uniqueness-by-basis}
A valid EIM is the basis of at most one valid Leo memo.
\end{theorem}

\begin{proof}
For a reductio, assume that
\Veim{e} is a valid EIM that is the basis of two
distinct Leo memos, call them \Vleo{l1} and \Vleo{l2},
so that
\begin{equation}
\label{eq:leo-memo-uniqueness-by-basis-5}
\tag{RAA}
\Vleo{l1} \neq \Vleo{l2}.
\end{equation}
From \dref[basis of a Leo memo]{def:basis-of-leo-memo},
we know that
\begin{gather}
\notag
\LSY{\Vleo{l1}} = \PLSY{\Veim{e}} = \LSY{\Vleo{l2}}
\\
\label{eq:leo-memo-uniqueness-by-basis-10}
\therefore \LSY{\Vleo{l1}} = \LSY{\Vleo{l2}}.
\end{gather}
But from
\tref{t:leo-memo-uniqueness-by-locsym}
we know that
\begin{align}
\label{eq:leo-memo-uniqueness-by-basis-20}
& \LSY{\Vleo{l1}} = \LSY{\Vleo{l2}} \implies \Vleo{l1} = \Vleo{l2}.
\\
\label{eq:leo-memo-uniqueness-by-basis-22}
& \Vleo{l1} = \Vleo{l2} \becuz
\eqref{eq:leo-memo-uniqueness-by-basis-10},
\eqref{eq:leo-memo-uniqueness-by-basis-20}.
\end{align}
Equation \eqref{eq:leo-memo-uniqueness-by-basis-22}
contradicts 
\eqref{eq:leo-memo-uniqueness-by-basis-5},
which shows the reductio and the theorem.
\end{proof}

\begin{theorem}
\ttitle{Leo memo uniqueness}
\label{t:leo-memos-match-uniquely}
Every EIM has at most one matching Leo memo.
\end{theorem}

\begin{proof}
Suppose, for a reductio,
that two distinct Leo memos match a single EIM.
Let, without loss of generality, the Leo memos be
\begin{gather*}
\Vleo{l1} = [ \Vsym{sym1}, \Vdr{dr1}, \Vorig{orig1}, \Vloc{curr1} ] \quad \text{and} \\
\Vleo{l2} = [ \Vsym{sym2}, \Vdr{dr2}, \Vorig{orig2}, \Vloc{curr2} ],
\end{gather*}
and let the EIM be \Veim{eim}.
Then
\begin{align}
\label{eq:leo-memos-match-uniquely-10}
& \myparbox{
$\Symbol{\Vleo{l1}} = \LHS{\Veim{eim}}$
\becuz{}
\dref[matching Leo memo]{def:eim-matching-leo-memo};
}
\\
\label{eq:leo-memos-match-uniquely-12}
& \myparbox{
$\Current{\Vleo{l1}} = \Left{\Veim{eim}}$
\becuz{}
\dref{def:eim-matching-leo-memo};
}
\\
\label{eq:leo-memos-match-uniquely-14}
& \myparbox{
$\Symbol{\Vleo{l2}} = \LHS{\Veim{eim}}$
\becuz{}
\dref{def:eim-matching-leo-memo};
}
\\
\label{eq:leo-memos-match-uniquely-16}
& \myparbox{
$\Current{\Vleo{l2}} = \Left{\Veim{eim}}$
\becuz{}
\dref{def:eim-matching-leo-memo};
}
\\
\label{eq:leo-memos-match-uniquely-18}
& \myparbox{
$\Symbol{\Vleo{l1}} = \Symbol{\Vleo{l2}}$
\becuz{}
\eqref{eq:leo-memos-match-uniquely-10},
\eqref{eq:leo-memos-match-uniquely-14};
}
\\
\label{eq:leo-memos-match-uniquely-20}
& \myparbox{
$\Current{\Vleo{l1}} = \Current{\Vleo{l2}}$
\becuz{}
\eqref{eq:leo-memos-match-uniquely-12},
\eqref{eq:leo-memos-match-uniquely-16}; and
}
\\
\label{eq:leo-memos-match-uniquely-22}
& \myparbox{
$\Vleo{l1} = \Vleo{l2}$
\becuz{}
\eqref{eq:leo-memos-match-uniquely-18},
\eqref{eq:leo-memos-match-uniquely-20},
\tref{t:leo-memo-uniqueness-by-locsym}.
}
\end{align}
Equation
\eqref{eq:leo-memos-match-uniquely-22} contradicts
our assumption for the reductio,
and shows the theorem.
\end{proof}

\begin{theorem}
\ttitle{Leo memo dotted rule is telluric}
\label{t:leo-memo-dotted-rule-is-telluric}
The dotted rule of a valid Leo memo is telluric.
\end{theorem}

\begin{proof}
Every Leo memo is in a catena, even if it is only a
trivial catena of length 1.
Therefore, if there is a Leo memo whose dotted rule is not telluric,
there is a catena that contains it, call it \var{cat}.
We assume, for a reductio, that such a \var{cat} exists,
and therefore that
\begin{equation}
\label{eq:leo-memo-dotted-rule-is-telluric-10}
\tag{RAA}
\exists \; \var{ix} : \text{\DR{\Vel{cat}{ix}} is not telluric}
\end{equation}

A Leo catena is finite in length
\tref{t:leo-catenas-are-finite}.
Therefore, if any \var{ix} satisfies
\eqref{eq:leo-memo-dotted-rule-is-telluric-10}
then there is a last \var{ix} that satisfies
\eqref{eq:leo-memo-dotted-rule-is-telluric-10}.
Let the last \var{ix} that satisfies
\eqref{eq:leo-memo-dotted-rule-is-telluric-10}
be \var{z}, so that
\begin{equation}
\label{eq:leo-memo-dotted-rule-is-telluric-12}
\forall \; \var{i} : \var{z} < \var{i} \le \Vlastix{cat}
\implies \text{\DR{\Vel{cat}{i}} is telluric}.
\end{equation}

Assume, for an inner reductio, that
\begin{align}
\label{eq:leo-memo-dotted-rule-is-telluric-13}
\tag{RAA1}
& \myparbox{%
$\var{z} = \Vlastix{cat}$; so that
}
\\
\label{eq:leo-memo-dotted-rule-is-telluric-15}
& \myparbox{%
\Vel{cat}{z} has no top-down cause
\becuz{}
\dref[catena]{def:leo-catena};
}
\\
\label{eq:leo-memo-dotted-rule-is-telluric-16}
& \myparbox{%
$\DR{\Vel{cat}{z}} =
\Next{\DR{\Veim{basis}}}$,
where \Veim{basis} is the basis of \Vel{cat}{z}
\becuz{}
\eqref{eq:leo-memo-dotted-rule-is-telluric-15},
\dref[validity of Leo memo with no top-down cause]{def:validity-of-leo-memo};
}
\\
\label{eq:leo-memo-dotted-rule-is-telluric-19}
& \myparbox{%
$\Postdot{\Veim{basis}} \neq \epsilon$
\becuz{}
\dref[basis of a Leo memo]{def:basis-of-leo-memo};
and
}
\\
\label{eq:leo-memo-dotted-rule-is-telluric-22}
& \myparbox{%
\Next{\DR{\Veim{basis}}}
is telluric
\becuz{}
\eqref{eq:leo-memo-dotted-rule-is-telluric-19}.
}
\intertext{
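Equation
\eqref{eq:leo-memo-dotted-rule-is-telluric-22},
together with
\eqref{eq:leo-memo-dotted-rule-is-telluric-16},
contradicts the choice of \var{z},
which shows the inner reductio,
from which we conclude that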
}
\label{eq:leo-memo-dotted-rule-is-telluric-25}
& 0 \le \var{z} < \Vlastix{cat};
\\
\label{eq:leo-memo-dotted-rule-is-telluric-28}
& \exists \; \el{cat}{\Vincr{z}}
\becuz{}
\eqref{eq:leo-memo-dotted-rule-is-telluric-25};
\\
\label{eq:leo-memo-dotted-rule-is-telluric-31}
& \myparbox{
\el{cat}{\Vincr{z}} is a top-down cause of \Vel{cat}{z}
\becuz{}
\eqref{eq:leo-memo-dotted-rule-is-telluric-28},
\dref[catena]{def:leo-catena};
}
\\
\label{eq:leo-memo-dotted-rule-is-telluric-34}
& \myparbox{
$\DR{\Vel{cat}{z}} = \DR{\el{cat}{\Vincr{z}}}$
\becuz{}
\eqref{eq:leo-memo-dotted-rule-is-telluric-31},
\dref[validity of Leo memo with top-down cause]{def:validity-of-leo-memo};
}
\\
\label{eq:leo-memo-dotted-rule-is-telluric-37}
& \myparbox{
\DR{\Vel{cat}{z}} is telluric
\becuz{}
\eqref{eq:leo-memo-dotted-rule-is-telluric-12},
\eqref{eq:leo-memo-dotted-rule-is-telluric-34}.
}
\end{align}
But our assumption for \var{z} was that \DR{\Vel{cat}{z}} is not telluric,
so that
\eqref{eq:leo-memo-dotted-rule-is-telluric-37}
shows the outer reductio.
\end{proof}

\chapter{Leo effects}

\begin{definition}
\dtitle{Leo silo effect}
\label{def:direct-leo-silo-effect}
We say that \Veim{eff}
is the
\dfn{direct Leo silo effect}
of \Veim{cuz}
if and only if
\begin{itemize}
\item
\Veim{cuz} is a valid EIM;
\item
\Vleo{l} is an instantiated Leo memo that matches \Veim{cuz}; and
\item
\Veim{eff} is an effect of \Veim{cuz}.
\end{itemize}
For brevity,
a direct Leo silo effect is
also called a
\dfn{direct Leo effect}.
\end{definition}

\begin{figure}[tb]
\figtitle{Direct Leo effect}{fig:direct-leo-effect}
\vspace{\baselineskip}
\begin{tikzcd}[column sep=huge, row sep=huge]
?\Vleo{l2}?
\arrow[dd, rightarrow]
&
& \Veim{cuz}
\arrow[dd, Rightarrow]
\arrow[dl, dotted, rightarrow, two heads]
\\
& \Veim{bas}
  \arrow[ul, dotted, leftrightarrow]
  \arrow[dr, rightarrow]
  \arrow[dl, Rightarrow]
&
\\
\Vleo{l}
  \arrow[uurr, dotted, swap, leftrightarrow, bend left]
  \arrow[ur, bend right, dotted, rightarrow, two heads]
& & \Veim{eff}
\end{tikzcd}
\vspace{.5\baselineskip}
\begin{flushleft}
\begin{tikzcd}
\var{down} \arrow[r, rightarrow] & \var{effect}
\end{tikzcd}:
\var{down} is the top-down cause of \var{effect}.
\\[-.4em]
\begin{tikzcd}
\var{up} \arrow[r, Rightarrow] & \var{effect}
\end{tikzcd}:
\var{up} is the bottom-up cause of \var{effect}.
\\[-.5em]
\begin{tikzcd}
\var{a} \arrow[r, dotted, leftrightarrow] & \var{b}
\end{tikzcd}:
\LSY{\var{a}} matches \LSY{\var{b}}.
\\[-.2em]
\begin{tikzcd}
\var{a} \arrow[r, rightarrow, dotted, two heads] & \var{b}
\end{tikzcd}:
\LSY{\var{a}} matches \PLSY{\var{b}}.
\par
The node for \Vleo{l2} is optional.
For a proof of correctness,
see \tref{t:direct-leo-effect-summary}.
\end{flushleft}
\vspace{.5\baselineskip}
\end{figure}

\begin{theorem}
\ttitle{Direct Leo effect summary}
\label{t:direct-leo-effect-summary}
Figure \ref{fig:direct-leo-effect}
is correct.
\end{theorem}

\begin{proof}
In this proof, we justify the existence
and form
of
the nodes and arrows of 
Figure \ref{fig:direct-leo-effect}.
Figure \ref{fig:direct-leo-effect}
illustrates a direct Leo effect,
which from
\dref[direct Leo silo effect]{def:direct-leo-silo-effect}
is a \Veim{eff}
such that the following preconditions hold:
\begin{align}
\label{eq:direct-leo-effect-summary-10}
& \myparbox{%
\Veim{cuz} is a valid EIM.
} \\
\label{eq:direct-leo-effect-summary-12}
& \myparbox{%
\Vleo{l} is an instantiated Leo memo.
} \\
\label{eq:direct-leo-effect-summary-14}
& \myparbox{%
\Vleo{l} matches \Veim{cuz}.
}
\end{align}

We take preconditions
\eqref{eq:direct-leo-effect-summary-10},
\eqref{eq:direct-leo-effect-summary-12}
and
\eqref{eq:direct-leo-effect-summary-14}
as assumptions for this theorem.

\begin{align}
\label{eq:direct-leo-effect-summary-20}
& \myparbox{%
There is exactly one \Veim{bas},
such that \Veim{bas} is valid
and the basis of \Vleo{l}
\becuz{}
\eqref{eq:direct-leo-effect-summary-12},
\tref{t:leo-basis-uniqueness}.
} \\
\label{eq:direct-leo-effect-summary-22}
& \myparbox{%
\Veim{cuz} is the bottom-up cause of an effect,
call it \Veim{eff}
\becuz{}
\eqref{eq:direct-leo-effect-summary-10},
\eqref{eq:direct-leo-effect-summary-12},
\eqref{eq:direct-leo-effect-summary-14},
\tref{t:leo-match-props}.
} \\
\label{eq:direct-leo-effect-summary-24}
& \myparbox{%
\Veim{bas} is the top-down cause of \Veim{eff}
\becuz{}
\eqref{eq:direct-leo-effect-summary-10},
\eqref{eq:direct-leo-effect-summary-12},
\eqref{eq:direct-leo-effect-summary-14},
\eqref{eq:direct-leo-effect-summary-20},
\eqref{eq:direct-leo-effect-summary-22},
\tref{t:leo-match-props}.
} \\
\label{eq:direct-leo-effect-summary-26}
& \myparbox{%
\Veim{bas} is a top-down matching cause of \Veim{cuz}
\becuz{}
\eqref{eq:direct-leo-effect-summary-10},
\eqref{eq:direct-leo-effect-summary-12},
\eqref{eq:direct-leo-effect-summary-14},
\eqref{eq:direct-leo-effect-summary-20},
\eqref{eq:direct-leo-effect-summary-22},
\tref{t:leo-match-props}.
} \\
\label{eq:direct-leo-effect-summary-28}
& \myparbox{%
$\PLSY{\Veim{bas}} = \LSY{\Veim{cuz}}$
\becuz{}
\eqref{eq:direct-leo-effect-summary-26},
\dref[matching causes]{def:matching-causes}.
} \\
\label{eq:direct-leo-effect-summary-30}
& \myparbox{%
$\LSY{\Vleo{l}} = \LSY{\Veim{cuz}}$
\becuz{}
\eqref{eq:direct-leo-effect-summary-14},
\dref[matching Leo memo]{def:eim-matching-leo-memo}.
} \\
\label{eq:direct-leo-effect-summary-32}
& \myparbox{%
$\LSY{\Vleo{l}} = \PLSY{\Veim{bas}}$
\becuz{}
\eqref{eq:direct-leo-effect-summary-20},
\dref[basis of a Leo memo]{def:basis-of-leo-memo}.
}
\end{align}

Figure \ref{fig:direct-leo-effect} states that \Vleo{l2}
is optional.
We make the conditional assumption that
\begin{align}
\label{eq:direct-leo-effect-summary-100}
& \myparbox{%
\Vleo{l2} exists, is instantiated
and is the top-down cause of \Vleo{l}
\becuz{}
conditional ASM.
} \\
\label{eq:direct-leo-effect-summary-102}
& \myparbox{%
$\LSY{\Veim{bas}} = \LSY{\Vleo{l2}}$
\becuz{}
\eqref{eq:direct-leo-effect-summary-20},
\eqref{eq:direct-leo-effect-summary-100},
\dref[Leo top-down cause]{def:down-cause-of-leo-memo}.
}
\end{align}

\textbf{Summary}:
For the nodes,
we have the correctness
of \Veim{cuz} \becuz{}
\eqref{eq:direct-leo-effect-summary-10};
the correctness of \Veim{bas} \becuz{}
\eqref{eq:direct-leo-effect-summary-20};
the correctness of \Veim{eff} \becuz{}
\eqref{eq:direct-leo-effect-summary-22};
the correctness of \Vleo{l} \becuz{}
\eqref{eq:direct-leo-effect-summary-12};
and the correctness of \Vleo{l2} \becuz{}
\eqref{eq:direct-leo-effect-summary-100}.
We have the correctness of the bottom-up cause
of \Vleo{l} from
\eqref{eq:direct-leo-effect-summary-20}
and
\dref[basis as bottom-up cause]{def:basis-of-leo-memo}.
We have the correctness of the bottom-up cause
of \Veim{eff} from
\eqref{eq:direct-leo-effect-summary-22}.
We have the correctness of the top-down causes
from
\eqref{eq:direct-leo-effect-summary-24}
and
\eqref{eq:direct-leo-effect-summary-100}.
We have the correctness of the LSY/LSY
matches from
\eqref{eq:direct-leo-effect-summary-30} and
\eqref{eq:direct-leo-effect-summary-102}.
We have the correctness of the LSY/PLSY
matches from
\eqref{eq:direct-leo-effect-summary-28}
and
\eqref{eq:direct-leo-effect-summary-32}.
\end{proof}

\begin{theorem}
\ttitle{Leo direct effect properties}
\label{t:leo-direct-effect-props}
We make the following assumptions:
\begin{subequations}
\renewcommand{\theequation}{A\arabic{equation}}
\begin{align}
\label{eq:leo-direct-effect-props-asm-1}
& \myparbox{%
\Veim{cuz} is a valid EIM.
} \\
\label{eq:leo-direct-effect-props-asm-2}
& \myparbox{%
\Vleo{l} is an instantiated Leo memo.
} \\
\label{eq:leo-direct-effect-props-asm-3}
& \myparbox{%
\Vleo{l} matches \Veim{cuz}.
}
\end{align}
\end{subequations}

If these assumptions hold, then
\begin{subequations}
\renewcommand{\theequation}{R\arabic{equation}}
\begin{align}
\label{eq:leo-direct-effect-props-req-0-5}
& \myparbox{%
\Vleo{l} has exactly one valid basis, \Veim{bas}.
} \\
\label{eq:leo-direct-effect-props-req-1}
& \myparbox{%
\Veim{cuz} and \Vleo{l} have exactly one valid direct Leo effect,
call it \Veim{eff}.
} \\
\label{eq:leo-direct-effect-props-req-2}
& \myparbox{%
\Veim{cuz} is a bottom-up cause of \Veim{eff}.
} \\
\label{eq:leo-direct-effect-props-req-3}
& \myparbox{%
\Veim{eff} is the only effect of \Veim{cuz}.
} \\
\label{eq:leo-direct-effect-props-req-3-1}
& \myparbox{%
\Veim{bas} is the only matching top-down cause
of \Veim{cuz}.
} \\
\label{eq:leo-direct-effect-props-req-3-2}
& \myparbox{%
The cause-pair
$[ \Veim{bas}, \Veim{cuz} ]$
is the cause of exactly one valid effect,
\Veim{eff}.
} \\
\label{eq:leo-direct-effect-props-req-4}
& \myparbox{%
$\Rule{\Veim{eff}} = \Rule{\Veim{bas}}$
} \\
\label{eq:leo-direct-effect-props-req-5}
& \myparbox{%
$\Right{\Veim{cuz}} = \Right{\Veim{eff}}$
} \\
\label{eq:leo-direct-effect-props-req-6}
& \myparbox{%
\Veim{eff} is right-recursive.
} \\
\label{eq:leo-direct-effect-props-req-6a}
& \myparbox{%
\Veim{cuz} is complete.
} \\
\label{eq:leo-direct-effect-props-req-7}
& \myparbox{%
\Veim{eff} is quasi-complete.
} \\
\label{eq:leo-direct-effect-props-req-8}
& \myparbox{%
\Veim{cuz} is a silo cause of \Veim{eff}.
} \\
\label{eq:leo-direct-effect-props-req-9}
& \myparbox{%
\Veim{eff} is the only silo effect of \Veim{cuz}.
}
\end{align}
\end{subequations}
\end{theorem}

\begin{proof}
We begin with the assumptions for the theorem:
\begin{align}
\label{eq:leo-direct-effect-props-16}
& \myparbox{%
\Veim{bas} is the basis of \Vleo{l}
and \Valid{\Veim{bas}}
\becuz{}
\eqref{eq:leo-direct-effect-props-asm-1},
\dref{def:validity-of-leo-memo},
which shows
Requirement~\eqref{eq:leo-direct-effect-props-req-0-5}
for this theorem.
} \\
\label{eq:leo-direct-effect-props-25}
& \myparbox{%
\Veim{cuz} is the cause of exactly one valid
effect, \Veim{eff}
\becuz{}
\eqref{eq:leo-direct-effect-props-asm-1},
\eqref{eq:leo-direct-effect-props-asm-2},
\eqref{eq:leo-direct-effect-props-asm-3},
\tref{t:leo-match-props}.
} \\
\label{eq:leo-direct-effect-props-26}
& \myparbox{%
\Veim{cuz} and \Vleo{l} have exactly one valid direct Leo effect,
which is \Veim{eff},
\becuz{}
\eqref{eq:leo-direct-effect-props-asm-1},
\eqref{eq:leo-direct-effect-props-asm-2},
\eqref{eq:leo-direct-effect-props-asm-3},
\eqref{eq:leo-direct-effect-props-25}
and
\dref[direct Leo silo effect]{def:direct-leo-silo-effect},
which shows Requirement~\eqref{eq:leo-direct-effect-props-req-1}
for this theorem.
} \\
\label{eq:leo-direct-effect-props-27}
& \myparbox{%
\Veim{cuz} is a bottom-up cause of \Veim{eff}
\becuz{}
\eqref{eq:leo-direct-effect-props-asm-1},
\eqref{eq:leo-direct-effect-props-asm-2},
\eqref{eq:leo-direct-effect-props-asm-3},
\tref{t:leo-match-props},
which shows Requirement~\eqref{eq:leo-direct-effect-props-req-2}
of this theorem.
} \\
\label{eq:leo-direct-effect-props-28}
& \myparbox{%
\Veim{cuz} is the cause of exactly one valid effect,
call it \Veim{eff}
\becuz{}
\eqref{eq:leo-direct-effect-props-asm-1},
\eqref{eq:leo-direct-effect-props-asm-2},
\eqref{eq:leo-direct-effect-props-asm-3},
\tref{t:leo-match-props},
which shows Requirement~\eqref{eq:leo-direct-effect-props-req-3}
of this theorem.
} \\
\label{eq:leo-direct-effect-props-30}
& \myparbox{%
\Veim{bas} is the only matching top-down cause
of \Veim{cuz}
\becuz{}
\eqref{eq:leo-direct-effect-props-asm-1},
\eqref{eq:leo-direct-effect-props-asm-2},
\eqref{eq:leo-direct-effect-props-asm-3},
\tref{t:leo-match-props},
which shows Requirement~\eqref{eq:leo-direct-effect-props-req-3-1}
of this theorem.
} \\
\label{eq:leo-direct-effect-props-31}
& \myparbox{%
The cause-pair
$[ \Veim{bas}, \Veim{cuz} ]$
is the cause of exactly one valid effect,
\Veim{eff}
\becuz{}
\eqref{eq:leo-direct-effect-props-asm-1},
\eqref{eq:leo-direct-effect-props-asm-2},
\eqref{eq:leo-direct-effect-props-asm-3},
\eqref{eq:leo-direct-effect-props-28},
\tref{t:leo-match-props},
which shows Requirement~\eqref{eq:leo-direct-effect-props-req-3-2}
of this theorem.
} \\
\label{eq:leo-direct-effect-props-34}
& \myparbox{%
$\Rule{\Veim{eff}} = \Rule{\Veim{bas}}$
\becuz{}
\eqref{eq:leo-direct-effect-props-31},
\tref{t:effect-from-symbolic-cause-pair},
which shows Requirement~\eqref{eq:leo-direct-effect-props-req-4}
for this theorem.
} \\
\label{eq:leo-direct-effect-props-36}
& \myparbox{%
$\Right{\Veim{eff}} = \Right{\Veim{cuz}}$
\becuz{}
\eqref{eq:leo-direct-effect-props-27},
\tref{t:confirmation-from-up-cause},
\tref{t:symbolic-causes-from-effect},
which shows Requirement~\eqref{eq:leo-direct-effect-props-req-5}
for this theorem.
} \\
\label{eq:leo-direct-effect-props-37}
& \myparbox{%
\Veim{bas} is Leo-eligible
\becuz{}
\eqref{eq:leo-direct-effect-props-16},
\dref[basis of Leo memo]{def:basis-of-leo-memo}.
} \\
\label{eq:leo-direct-effect-props-37-1}
& \myparbox{%
\Veim{bas} is right-recursive
\becuz{}
\eqref{eq:leo-direct-effect-props-37},
\dref[Leo-eligible]{def:leo-eligible}.
} \\
\label{eq:leo-direct-effect-props-38}
& \myparbox{%
\Veim{eff} is right-recursive
\becuz{}
\eqref{eq:leo-direct-effect-props-34},
\eqref{eq:leo-direct-effect-props-37-1},
which shows Requirement~\eqref{eq:leo-direct-effect-props-req-6}
for this theorem.
} \\
\label{eq:leo-direct-effect-props-40}
& \myparbox{%
\Veim{cuz} is complete
\becuz{}
\eqref{eq:leo-direct-effect-props-asm-3},
\dref[matching Leo memo]{def:eim-matching-leo-memo},
which shows Requirement~\eqref{eq:leo-direct-effect-props-req-6a}
for this theorem.
} \\
\label{eq:leo-direct-effect-props-44}
& \myparbox{%
\Veim{bas} is a quasi-penult
\becuz{}
\eqref{eq:leo-direct-effect-props-37},
\dref[Leo-eligible]{def:leo-eligible}.
} \\
\label{eq:leo-direct-effect-props-46}
& \var{suffix} \defined
\RHS{\Veim{bas}}
  \left[
  \begin{gathered}
  \Vincr{\Dotix{\Veim{bas}}} \\
  \quad \ldots \; \Vlastix{\RHS{\Veim{bas}}} \\
  \end{gathered}
  \right].
\\
\label{eq:leo-direct-effect-props-48}
& \myparbox{%
$\var{suffix} \destar \epsilon$
\becuz{}
\eqref{eq:leo-direct-effect-props-44},
\eqref{eq:leo-direct-effect-props-46},
\dref[quasi-penult DR]{def:quasi-types},
\dref[DR notions for EIM's]{def:eim-dr-notions}.
}
\intertext{%
Note that in
\eqref{eq:leo-direct-effect-props-48} we can say that \var{suffix} is nulling wherever it occurs,
because, in a Marpa grammar, every symbol is always either
telluric (non-nulling) or nulling --- there are no proper nullables.
}
\label{eq:leo-direct-effect-props-50}
& \myparbox{%
$\Dotix{\Veim{eff}} = \Vincr{\Dotix{\Veim{bas}}}$
\becuz{}
\eqref{eq:leo-direct-effect-props-31},
\dref[causes of confirmed EIM's]{def:causes-confirmed}.
} \\
\label{eq:leo-direct-effect-props-52}
& \myparbox{%
$\RHS{\Veim{eff}}[\Dotix{\Veim{eff}} \ldots \Vlastix{\RHS{\Veim{eff}}}] = \var{suffix}$
\becuz{}
\eqref{eq:leo-direct-effect-props-34},
\eqref{eq:leo-direct-effect-props-46},
\eqref{eq:leo-direct-effect-props-50}.
} \\
\label{eq:leo-direct-effect-props-54}
& \myparbox{%
$\RHS{\Veim{eff}}[\Dotix{\Veim{eff}} \ldots \Vlastix{\RHS{\Veim{eff}}}] \destar \epsilon$
\becuz{}
\eqref{eq:leo-direct-effect-props-48},
\eqref{eq:leo-direct-effect-props-52}.
} \\
\label{eq:leo-direct-effect-props-56}
& \myparbox{%
\Veim{eff} is quasi-complete
\becuz{}
\eqref{eq:leo-direct-effect-props-54},
\dref[quasi-complete DR]{def:quasi-types},
\dref[DR notions for EIM's]{def:eim-dr-notions},
which shows Requirement~\eqref{eq:leo-direct-effect-props-req-7}
for this theorem.
} \\
\label{eq:leo-direct-effect-props-58}
& \myparbox{%
\Veim{cuz} is a silo cause of \Veim{eff}
\becuz{}
\eqref{eq:leo-direct-effect-props-27},
\eqref{eq:leo-direct-effect-props-36},
\eqref{eq:leo-direct-effect-props-40},
\eqref{eq:leo-direct-effect-props-56},
\dref[silo]{def:silo},
which is Requirement~\eqref{eq:leo-direct-effect-props-req-8}
for this theorem.
} \\
\label{eq:leo-direct-effect-props-60}
& \myparbox{%
\Veim{eff} is the only silo effect of \Veim{cuz}
\becuz{}
\eqref{eq:leo-direct-effect-props-25},
\eqref{eq:leo-direct-effect-props-58},
\dref{def:silo},
which is Requirement~\eqref{eq:leo-direct-effect-props-req-9}
for this theorem.
}
\end{align}
\end{proof}

\begin{theorem}
\ttitle{Matching memo of Leo effect}
\label{matching-memo-of-Leo-effect}
Assume that
\begin{subequations}
\renewcommand{\theequation}{A\arabic{equation}}
\begin{align}
\label{eq:matching-memo-of-leo-direct-effect-asm-1}
& \myparbox{%
\Veim{cuz} is a valid EIM.
} \\
\label{eq:matching-memo-of-leo-direct-effect-asm-2}
& \myparbox{%
\Vleo{l} is an instantiated Leo memo.
} \\
\label{eq:matching-memo-of-leo-direct-effect-asm-3}
& \myparbox{%
\Vleo{l} matches \Veim{cuz}.
}
\end{align}
\end{subequations}
Then
\begin{subequations}
\renewcommand{\theequation}{R\arabic{equation}}
\begin{align}
\label{eq:matching-memo-of-leo-direct-effect-req-0-5}
& \myparbox{%
\Veim{cuz} has exactly one 
direct Leo effect, \Veim{eff}.
} \\
\label{eq:matching-memo-of-leo-direct-effect-req-1}
& \myparbox{%
If \Vleo{l} has an instantiated top-down cause,
call it \Vleo{eff},
then \Vleo{eff} matches \Veim{eff}.
} \\
\label{eq:matching-memo-of-leo-direct-effect-req-2}
& \myparbox{%
If \Veim{eff} has an instantiated matching Leo memo,
call it \Vleo{eff},
then \Vleo{eff} is the top-down cause of \Vleo{l}.
}
\end{align}
\end{subequations}
\end{theorem}

\begin{proof}
\begin{align}
\label{eq:matching-memo-of-leo-direct-effect-10}
& \myparbox{%
\Veim{cuz} has exactly one 
direct Leo effect, \Veim{eff}
\becuz{}
\eqref{eq:matching-memo-of-leo-direct-effect-asm-1},
\eqref{eq:matching-memo-of-leo-direct-effect-asm-2},
\eqref{eq:matching-memo-of-leo-direct-effect-asm-3},
\eqref{eq:leo-direct-effect-props-req-1}
of \tref{t:leo-direct-effect-props},
which
shows
Requirement~\eqref{eq:matching-memo-of-leo-direct-effect-req-0-5}
of this theorem.
} \\
\label{eq:matching-memo-of-leo-direct-effect-11}
& \myparbox{%
\Vleo{l} has exactly one basis, call it \Veim{bas}
\becuz{}
\eqref{eq:matching-memo-of-leo-direct-effect-asm-2},
\tref{t:leo-basis-uniqueness}.
} \\
\label{eq:matching-memo-of-leo-direct-effect-12}
& \myparbox{%
\Veim{bas} is the only matching top-down cause
of \Veim{cuz}
\becuz{}
\eqref{eq:matching-memo-of-leo-direct-effect-asm-1},
\eqref{eq:matching-memo-of-leo-direct-effect-asm-2},
\eqref{eq:matching-memo-of-leo-direct-effect-asm-3},
\eqref{eq:leo-direct-effect-props-req-3-1}
of \tref{t:leo-direct-effect-props}.
} \\
\label{eq:matching-memo-of-leo-direct-effect-14}
& \myparbox{%
The cause-pair
$[ \Veim{bas}, \Veim{cuz} ]$
is the cause of exactly one valid effect,
\Veim{eff}
\becuz{}
\eqref{eq:matching-memo-of-leo-direct-effect-asm-1},
\eqref{eq:matching-memo-of-leo-direct-effect-asm-2},
\eqref{eq:matching-memo-of-leo-direct-effect-asm-3},
\eqref{eq:matching-memo-of-leo-direct-effect-10},
\eqref{eq:leo-direct-effect-props-req-3-2}
of \tref{t:leo-direct-effect-props}.
} \\
\label{eq:matching-memo-of-leo-direct-effect-15}
& \myparbox{%
\Veim{eff} is a confirmed EIM
\becuz{}
\eqref{eq:matching-memo-of-leo-direct-effect-14},
\tref{t:confirmation-from-up-cause}.
} \\
\label{eq:matching-memo-of-leo-direct-effect-16}
& \myparbox{%
$\Left{\Veim{bas}} = \Left{\Veim{eff}}$
\becuz{}
\eqref{eq:matching-memo-of-leo-direct-effect-14},
\eqref{eq:matching-memo-of-leo-direct-effect-15},
\dref[cause-pair of confirmed EIM]{def:causes-confirmed}.
} \\
\label{eq:matching-memo-of-leo-direct-effect-18}
& \myparbox{%
$\Rule{\Veim{bas}} = \Rule{\Veim{eff}}$
\becuz{}
\eqref{eq:matching-memo-of-leo-direct-effect-asm-1},
\eqref{eq:matching-memo-of-leo-direct-effect-asm-2},
\eqref{eq:matching-memo-of-leo-direct-effect-asm-3},
\eqref{eq:leo-direct-effect-props-req-4}
of \tref{t:leo-direct-effect-props}.
} \\
\label{eq:matching-memo-of-leo-direct-effect-20}
& \myparbox{%
$\LSY{\Veim{bas}} = \LSY{\Veim{eff}}$
\becuz{}
\eqref{eq:matching-memo-of-leo-direct-effect-16},
\eqref{eq:matching-memo-of-leo-direct-effect-18}.
}
\end{align}

Requirement~\eqref{eq:matching-memo-of-leo-direct-effect-req-1}
is a conditional.
To show the conditional, we assume the antecedent to
show the consequent.
\begin{subequations}
\renewcommand{\theequation}{C1-\arabic{equation}}
\setlength{\mathparwidth}{\dimexpr\mathparwidth-1em}
\begin{align}
\label{eq:matching-memo-of-leo-direct-effect-C1-1}
& \myparbox{%
\Vleo{l} has an instantiated top-down cause,
call it \Vleo{eff}
\becuz{}
ASM for conditional.
} \\
\label{eq:matching-memo-of-leo-direct-effect-C1-3}
& \myparbox{%
$\LSY{\Vleo{eff}} = \LSY{\Veim{bas}}$
\becuz{}
\eqref{eq:matching-memo-of-leo-direct-effect-11},
\eqref{eq:matching-memo-of-leo-direct-effect-C1-1},
\dref[Leo top-down cause]{def:down-cause-of-leo-memo}.
} \\
\label{eq:matching-memo-of-leo-direct-effect-C1-5}
& \myparbox{%
$\LSY{\Vleo{eff}} = \LSY{\Veim{eff}}$
\becuz{}
\eqref{eq:matching-memo-of-leo-direct-effect-20},
\eqref{eq:matching-memo-of-leo-direct-effect-C1-3}.
} \\
\label{eq:matching-memo-of-leo-direct-effect-C1-7}
& \myparbox{%
\Vleo{eff} matches \Veim{eff}
\becuz{}
\eqref{eq:matching-memo-of-leo-direct-effect-C1-5},
\dref[matching Leo memo]{def:eim-matching-leo-memo}.
}
\end{align}
\end{subequations}
Equations
\eqref{eq:matching-memo-of-leo-direct-effect-C1-1}--%
\eqref{eq:matching-memo-of-leo-direct-effect-C1-7}
show that we may conclude
\eqref{eq:matching-memo-of-leo-direct-effect-C1-7}
from
\eqref{eq:matching-memo-of-leo-direct-effect-C1-1},
which shows 
Requirement~\eqref{eq:matching-memo-of-leo-direct-effect-req-1}.

Requirement~\eqref{eq:matching-memo-of-leo-direct-effect-req-2}
is also a conditional.
Again we assume its antecedent to show its consequent.
\begin{subequations}
\renewcommand{\theequation}{C2-\arabic{equation}}
\setlength{\mathparwidth}{\dimexpr\mathparwidth-1em}
\begin{align}
\label{eq:matching-memo-of-leo-direct-effect-C2-1}
& \myparbox{%
\Vleo{eff} is instantiated and
matches \Veim{eff}
\becuz{}
ASM for conditional.
} \\
\label{eq:matching-memo-of-leo-direct-effect-C2-3}
& \myparbox{%
$\LSY{\Vleo{eff}} = \LSY{\Veim{eff}}$
\becuz{}
\eqref{eq:matching-memo-of-leo-direct-effect-C2-1},
\dref[matching Leo memo]{def:eim-matching-leo-memo}.
} \\
\label{eq:matching-memo-of-leo-direct-effect-C2-5}
& \myparbox{%
$\LSY{\Vleo{eff}} = \LSY{\Veim{bas}}$
\becuz{}
\eqref{eq:matching-memo-of-leo-direct-effect-20},
\eqref{eq:matching-memo-of-leo-direct-effect-C2-3}.
} \\
\label{eq:matching-memo-of-leo-direct-effect-C2-7}
& \myparbox{%
\Vleo{eff} is the top-down cause of \Vleo{l}
\becuz{}
\eqref{eq:matching-memo-of-leo-direct-effect-C2-1},
\eqref{eq:matching-memo-of-leo-direct-effect-C2-5},
\dref[Leo top-down cause]{def:down-cause-of-leo-memo}.
}
\end{align}
\end{subequations}
Equations
\eqref{eq:matching-memo-of-leo-direct-effect-C2-1}--%
\eqref{eq:matching-memo-of-leo-direct-effect-C2-7}
show that we may conclude
\eqref{eq:matching-memo-of-leo-direct-effect-C2-7}
from
\eqref{eq:matching-memo-of-leo-direct-effect-C2-1},
which shows 
Requirement~\eqref{eq:matching-memo-of-leo-direct-effect-req-2}.
\end{proof}

\begin{definition}
\dtitle{Indirect Leo silo effect}
\label{def:indirect-leo-silo-effect}
We say that \Veim{eff}
is the
\dfn{indirect Leo silo effect}
of \Veim{cuz}
if and only if
\begin{itemize}
\item
\Veim{cuz} is a valid EIM;
\item
\Vleo{l} is an instantiated Leo memo;
\item
\Vleo{l} does not match \Veim{cuz};
\item
\Vleo{l} quasi-matches \Veim{cuz}; and
\item
\Veim{eff} is a valid effect of \Veim{cuz}.
\end{itemize}
For brevity,
an indirect Leo silo effect is
also called a
\dfn{indirect Leo effect}.
\end{definition}

\begin{figure}[tb]
\figtitle{Indirect Leo effect}{fig:indirect-leo-effect}
\vspace{\baselineskip}
\begin{tikzcd}[column sep=huge, row sep=huge]
\Vleo{l}
  \arrow[r, leftrightarrow, dotted]
  \arrow[dr, leftrightarrow, dotted]
& \Veim{cuz}
\arrow[d, rightarrow]
\\
& \Veim{eff}
\end{tikzcd}
\vspace{.5\baselineskip}
\begin{flushleft}
\begin{tikzcd}
\var{down} \arrow[r, rightarrow] & \var{effect}
\end{tikzcd}:
\var{down} is the top-down cause of \var{effect}.
\\[-.3em]
\begin{tikzcd}
\var{a} \arrow[r, dotted, leftrightarrow] & \var{b}
\end{tikzcd}:
\LSY{\var{a}} quasi-matches \LSY{\var{b}}.
\par
For a proof of correctness,
see \tref{t:indirect-leo-effect-summary}.
\end{flushleft}
\vspace{.5\baselineskip}
\end{figure}

\begin{theorem}
\ttitle{Indirect Leo summary}
\label{t:indirect-leo-effect-summary}
Figure \ref{fig:indirect-leo-effect}
is correct.
\end{theorem}

\begin{proof}
In this proof, we justify the existence
and form
of
the nodes and arrows of 
Figure \ref{fig:indirect-leo-effect}.
Figure \ref{fig:indirect-leo-effect}
illustrates an indirect Leo effect,
which from
\dref[indirect Leo silo effect]{def:indirect-leo-silo-effect}
is an \Veim{eff}
such that the following preconditions hold:
\begin{align}
\label{eq:indirect-leo-effect-summary-10}
& \myparbox{%
\Veim{cuz} is a valid EIM.
} \\
\label{eq:indirect-leo-effect-summary-12}
& \myparbox{%
\Vleo{l} is an instantiated Leo memo.
} \\
\label{eq:indirect-leo-effect-summary-14}
& \myparbox{%
\Vleo{l} does not match \Veim{cuz}.
} \\
\label{eq:indirect-leo-effect-summary-16}
& \myparbox{%
\Vleo{l} quasi-matches \Veim{cuz}.
}
\end{align}

We take preconditions
\eqref{eq:indirect-leo-effect-summary-10},
\eqref{eq:indirect-leo-effect-summary-12},
\eqref{eq:indirect-leo-effect-summary-14}
and
\eqref{eq:indirect-leo-effect-summary-16}
as assumptions for this theorem.

\begin{align}
\label{eq:indirect-leo-effect-summary-22}
& \myparbox{%
\Veim{cuz} is incomplete
\becuz{}
\eqref{eq:indirect-leo-effect-summary-14},
\dref{def:quasi-matching-leo-memo},
\dref[matching Leo memo]{def:eim-matching-leo-memo}.
} \\
\label{eq:indirect-leo-effect-summary-24}
& \myparbox{%
\Veim{cuz} is the top-down cause of a
null-scan effect, call it \Veim{eff}
\becuz{}
\eqref{eq:indirect-leo-effect-summary-10},
\eqref{eq:indirect-leo-effect-summary-22},
\tref{t:null-scan-from-down-cause}.
} \\
\label{eq:indirect-leo-effect-summary-26}
& \myparbox{%
\Veim{cuz} and \Veim{eff} are in the same
fleeting closure
\becuz{}
\eqref{eq:indirect-leo-effect-summary-24},
\dref[fleeting closure]{def:fleeting-closure-sequence}.
} \\
\label{eq:indirect-leo-effect-summary-28}
& \myparbox{%
\Veim{cuz} and \Veim{eff} share the same EIM completion
\becuz{}
\eqref{eq:indirect-leo-effect-summary-26},
\tref{t:fc-shares-eim-completion}.
} \\
\label{eq:indirect-leo-effect-summary-29}
& \myparbox{%
\Veim{cuz} is quasi-complete
\becuz{}
\eqref{eq:indirect-leo-effect-summary-16},
\dref[quasi-matching Leo memo]{def:quasi-matching-leo-memo}.
} \\
\label{eq:indirect-leo-effect-summary-30}
& \myparbox{%
\Vleo{l} quasi-matches \Veim{eff}
\becuz{}
\eqref{eq:indirect-leo-effect-summary-28},
\eqref{eq:indirect-leo-effect-summary-29},
\dref[quasi-matching Leo memo]{def:quasi-matching-leo-memo}.
}
\end{align}

\textbf{Summary}:
For the nodes,
we have the correctness
of \Veim{cuz} \becuz{}
\eqref{eq:indirect-leo-effect-summary-10};
the correctness of \Vleo{l} \becuz{}
\eqref{eq:indirect-leo-effect-summary-12};
and
the correctness of \Veim{eff} \becuz{}
\eqref{eq:indirect-leo-effect-summary-24}.
We have the correctness of the top-down cause
of \Veim{eff} from
\eqref{eq:indirect-leo-effect-summary-24}.
We have the correctness of the
quasi-matches from
\eqref{eq:indirect-leo-effect-summary-16}
and
\eqref{eq:indirect-leo-effect-summary-30}.
\end{proof}

TODO: TOHERE

\begin{theorem}
\ttitle{Leo indirect effect properties}
\label{t:leo-indirect-effect-props}
We make the following assumptions:
\begin{subequations}
\renewcommand{\theequation}{A\arabic{equation}}
\begin{align}
\label{eq:leo-indirect-effect-props-asm-1}
& \myparbox{%
\Veim{cuz} is a valid EIM.
} \\
\label{eq:leo-indirect-effect-props-asm-2}
& \myparbox{%
\Vleo{l} is an instantiated Leo memo.
} \\
\label{eq:leo-indirect-effect-props-asm-3}
& \myparbox{%
\Vleo{l} does not match \Veim{cuz}.
} \\
\label{eq:leo-indirect-effect-props-asm-4}
& \myparbox{%
\Vleo{l} quasi-matches \Veim{cuz}.
}
\end{align}
\end{subequations}

If these assumptions hold, then
\begin{subequations}
\renewcommand{\theequation}{R\arabic{equation}}
\begin{align}
\label{eq:leo-indirect-effect-props-req-0-5}
& \myparbox{%
\Vleo{l} has exactly one valid basis, \Veim{bas}.
} \\
\label{eq:leo-indirect-effect-props-req-1}
& \myparbox{%
\Veim{cuz} and \Vleo{l} have exactly one valid indirect Leo effect,
call it \Veim{eff}.
} \\
\label{eq:leo-indirect-effect-props-req-2}
& \myparbox{%
\Veim{cuz} is a top-down cause of \Veim{eff}.
} \\
\label{eq:leo-indirect-effect-props-req-3}
& \myparbox{%
\Veim{eff} is the only effect of \Veim{cuz}.
} \\
& \myparbox{%
The only bottom-up cause of
\Veim{eff} is ethereal.
} \\
\label{eq:leo-indirect-effect-props-req-4}
& \myparbox{%
\Veim{cuz} is the only top-down cause
of \Veim{eff}.
} \\
\label{eq:leo-indirect-effect-props-req-5}
& \myparbox{%
$\Rule{\Veim{eff}} = \Rule{\Veim{cuz}}$.
} \\
\label{eq:leo-indirect-effect-props-req-6}
& \myparbox{%
$\Right{\Veim{eff}} = \Right{\Veim{cuz}}$.
} \\
\label{eq:leo-indirect-effect-props-req-7}
& \myparbox{%
\Veim{cuz} is quasi-complete.
} \\
\label{eq:leo-indirect-effect-props-req-8}
& \myparbox{%
\Veim{cuz} is incomplete.
} \\
\label{eq:leo-indirect-effect-props-req-9}
& \myparbox{%
\Veim{eff} is quasi-complete.
} \\
\label{eq:leo-indirect-effect-props-req-10}
& \myparbox{%
\Veim{cuz} is a silo cause of \Veim{eff}.
} \\
\label{eq:leo-indirect-effect-props-req-11}
& \myparbox{%
\Veim{eff} is the only silo effect of \Veim{cuz}.
} \\
\label{eq:leo-indirect-effect-props-req-12}
& \myparbox{%
\Vleo{l} quasi-matches \Veim{eff}.
}
\end{align}
\end{subequations}
\end{theorem}

\begin{proof}
\begin{align}
\label{eq:leo-indirect-effect-props-10}
& \myparbox{%
\Vleo{l} has exactly one valid basis, \Veim{bas},
\becuz{}
\eqref{eq:leo-indirect-effect-props-asm-2},
\tref{t:leo-basis-uniqueness},
which is
Requirement~\eqref{eq:leo-indirect-effect-props-req-0-5}
of this theorem.
} \\
\label{eq:leo-indirect-effect-props-30}
& \myparbox{%
\Veim{cuz} and \Vleo{l} have exactly one valid indirect Leo effect,
call it \Veim{eff},
\becuz{}
TODO
which is
Requirement~\eqref{eq:leo-indirect-effect-props-req-1}
of this theorem.
}
\end{align}
\end{proof}

TODO: pieces.
\dref[Leo-eligible]{def:leo-eligible}.
\dref[Leo top-down cause]{def:down-cause-of-leo-memo}.
\dref[basis of Leo memo]{def:basis-of-leo-memo}.
\dref[causes of confirmed EIM]{def:causes-confirmed}.
\dref[matching Leo memo]{def:eim-matching-leo-memo}.
\dref[matching top-down and bottom-up causes]{def:matching-causes}.
\dref[quasi-penult]{def:quasi-types}.
\dref[silo]{def:silo}.

\begin{definition}
\dtitle{Leo effect}
\label{def:leo-effect}
A
\xdfn{Leo effect}{Leo effect!EIM}
is an EIM which
is either a direct Leo effect
or an indirect Leo effect.
If \Veim{eff} is a Leo effect,
the
\xdfn{Leo cause}{Leo cause!EIM, of an EIM}
of \Veim{eff}
is
the silo cause of \Veim{eff}.
We define a
\xdfn{Leo cause}{Leo cause!EIM}
to be any EIM which is the Leo cause
of some Leo effect.
\end{definition}

\chapter{Leo silos}

\begin{definition}
\dtitle{Leo silo}
\label{def:leo-silo}
Let
\begin{align*}
& \text{\Veim{lb} be a complete EIM;}
\\
& \text{\Vleo{l} be a matching Leo memo;}
\\
& \Veim{mem-top} = \big[ \DR{\Vleo{l}}, \Left{\Vleo{l}}, \Vloc{i} \big];
\\
& \begin{aligned}
& \text{\Veim{top} be a completion of \Veim{mem-top}, so that}
\\
& \qquad \DR{\Veim{top}} =
\big[ \Rule{\Veim{mem-top}}, \Vsize{\Rule{\Veim{mem-top}}}
\big] \; \text{and}
\\
  & \qquad \Left{\Veim{top}} = \Left{\Veim{mem-top}}.
\end{aligned}
\end{align*}
Let
\var{lsl} be a silo whose bottom
layer is \Veim{lb} and whose top layer is
\Veim{top}.
Then we say that
\begin{itemize}
\item
\var{lsl} is a
\xdfn{Leo silo}{Leo silo};
\item
that \Veim{lb}
is the
\dfn{bottom}%
\index{recce-definitions}{bottom@bottom (EIM)!of a Leo silo}
of \var{lsl};
\item
that \Veim{mem-top} is the
\dfn{memoized top}%
\index{recce-definitions}{memoized top@memoized top (EIM)!of a Leo silo}%
\index{recce-definitions}{top@top (EIM)!memoized, of a Leo silo}
of \var{lsl}; and
\item
that \Veim{top} is the
\dfn{completed top}%
\index{recce-definitions}{completed top@completed top (EIM)!of a Leo silo}%
\index{recce-definitions}{top@top (EIM)!completed, of a Leo silo},
or simply
\dfn{top},%
\index{recce-definitions}{top@top (EIM)!of a Leo silo}
of \var{lsl}.
\end{itemize}
\end{definition}

\begin{theorem}
\ttitle{Memoized top is telluric}
\label{t:memoized-top-is-telluric}
The memoized top of a Leo silo is telluric.
\end{theorem}

\begin{proof}
This theorem follows from
the definition of a memoized top,
and Theorem
\ref{t:leo-memo-dotted-rule-is-telluric}.
\end{proof}

\begin{theorem}
\label{t:leo-top-fleeting-closure}
Let \var{lsl} be a Leo silo.
Then the memoized top
of \var{lsl}
is the lasting base of a maximal
fleeting closure silo,
call it \var{mfcslo}.
Also the completion of \var{mfcslo}
is the completed top of \var{lsl}.
\end{theorem}

\begin{proof}
Let \Veim{memtop} be the
memoized top of \var{lsl}.
Since \Veim{memtop} is a layer of the Leo silo \var{lsl},
\Veim{memtop} is a silo layer
and therefore,
by the definition of a silo layer,
\Veim{memtop} is quasi-complete.
Since \Veim{memtop} is quasi-complete,
by Theorem
\ref{t:maximal-fleeting-closure-silo},
it is the base of a fleeting closure silo,
call it \var{fcslo}.
By Theorem
\ref{t:memoized-top-is-telluric},
we know that \Veim{memtop} is telluric,
so that, by the definition of a lasting base,
\Veim{memtop} is the lasting base of
\var{fcslo}; and
by the definition of a maximal fleeting closure,
\var{fcslo} is maximal.

Let $\var{mfcslo} = \var{fcslo}$.
If
\Veim{top} is the completion of \var{mfcslo},
from the definition of the completion of a fleeting
closure silo,
and the definition of the completed top of a Leo silo,
we see that the completion of \var{mfcslo} is
the completed top of \var{lsl}.
\end{proof}

\begin{theorem}
\ttitle{Sharing a Leo completed top is equivalent to sharing a memoized top}
\label{t:memoized-top-to-completed-top}
Two Leo silos have the same completed Leo top
if and only if they have the same memoized Leo top.
\end{theorem}

\begin{proof}
Let \var{lsl1} be a Leo silo whose memoized top is \Veim{mem1}
and whose completed top is \Veim{comp1}.
Let \var{lsl2} be a Leo silo whose memoized top is \Veim{mem2}
and whose completed top is \Veim{comp2}.
We proceed first with the ``if'' direction,
by assuming that
\begin{equation}
\label{t:memoized-top-to-completed-top-10}
\Veim{mem1} = \Veim{mem2}
\end{equation}
to show that
\Veim{comp1} = \Veim{comp2}.
\begin{align}
\label{t:memoized-top-to-completed-top-12}
& \myparbox{\Veim{mem1} and \Veim{comp1} share a fleeting closure
$\because$ Th \ref{t:leo-top-fleeting-closure};}
\\
\label{t:memoized-top-to-completed-top-14}
& \myparbox{\Veim{mem2} and \Veim{comp2} share a fleeting closure
$\because$ Th \ref{t:leo-top-fleeting-closure};}
\\
\label{t:memoized-top-to-completed-top-16}
& \myparbox{$\Rule{\var{comp1}} = \Rule{\var{comp2}} = \Rule{\var{mem1}} = \Rule{\var{mem2}}
\because \eqref{t:memoized-top-to-completed-top-10},
\eqref{t:memoized-top-to-completed-top-12},
\eqref{t:memoized-top-to-completed-top-14};
$}
\\
\label{t:memoized-top-to-completed-top-18}
& \myparbox{$\Left{\var{comp1}} = \Left{\var{comp2}} = \Left{\var{mem1}} = \Left{\var{mem2}}
\because \eqref{t:memoized-top-to-completed-top-10},
\eqref{t:memoized-top-to-completed-top-12},
\eqref{t:memoized-top-to-completed-top-14};
$}
\\
\label{t:memoized-top-to-completed-top-20}
& \myparbox{$\Current{\var{comp1}} = \Current{\var{comp2}} = \Current{\var{mem1}} = \Current{\var{mem2}}
\because \eqref{t:memoized-top-to-completed-top-10},
\eqref{t:memoized-top-to-completed-top-12},
\eqref{t:memoized-top-to-completed-top-14};
$}
\intertext{We know that
\Veim{comp1} and \Veim{comp2} are the completions of fleeting closures
and therefore are complete EIM's, and since by 
(TODO -- is this right?)
\eqref{t:memoized-top-to-completed-top-20}
they are completions of the same rule,}
\label{t:memoized-top-to-completed-top-22}
& \Dotix{\var{comp1}} = \Dotix{\var{comp2}}, \text{so that}
\\
\label{t:memoized-top-to-completed-top-24}
& \Veim{comp1} = \Veim{comp2} \because
\eqref{t:memoized-top-to-completed-top-16},
\eqref{t:memoized-top-to-completed-top-18},
\eqref{t:memoized-top-to-completed-top-20},
\eqref{t:memoized-top-to-completed-top-22};
\end{align}
where
\eqref{t:memoized-top-to-completed-top-24}
is what we needed to show for the ``if'' direction.

For the ``only if'' direction,
we assume that
\begin{equation}
\label{t:memoized-top-to-completed-top-30}
\Veim{comp1} = \Veim{comp2}
\end{equation}
and proceed as follows:
\begin{align}
\label{t:memoized-top-to-completed-top-32}
& \myparbox{\Veim{mem1} is the lasting base of \Veim{comp1}
$\because$ Th \ref{t:leo-top-fleeting-closure};}
\\
\label{t:memoized-top-to-completed-top-33}
& \myparbox{\Veim{mem2} is the lasting base of \Veim{comp2}
$\because$ Th \ref{t:leo-top-fleeting-closure};}
\intertext{and since by
Theorem \ref{t:eim-lasting-base},
every EIM has exactly one lasting base,
}
\label{t:memoized-top-to-completed-top-34}
& \myparbox{
$\Veim{mem1} = \Veim{mem2}
\because$
\eqref{t:memoized-top-to-completed-top-30},
\eqref{t:memoized-top-to-completed-top-32},
\eqref{t:memoized-top-to-completed-top-33},
Th
\ref{t:eim-lasting-base};
}
\end{align}
where
\eqref{t:memoized-top-to-completed-top-34}
is what we needed to show for the ``only if''
direction.
\end{proof}

\begin{definition}
\dtitle{Silo layers by level}
Let \var{lsl} be a Leo silo,
let \var{topmfc} be the maximal fleeting silo
containing the memoized top layer of \var{lsl}
and let \Veim{lb} be the bottom layer of \var{lsl}.
Let \Veim{lyr} be a layer of \var{lsl}.
We say that \Veim{lyr} is
\begin{itemize}
\item
an \xdfn{inner}{inner (layer of a Leo silo)}
layer
if $\Veim{lyr} \neq \Veim{lb} \land \Veim{lyr} \notin \var{topmfc}$;
\item
a \xdfn{lower}{lower (layer of a Leo silo)}
layer of \var{lsl}
if $\Veim{lyr} \notin \var{topmfc}$;
\item
an \xdfn{upper}{upper (layer of a Leo silo)}
layer of \var{lsl}
if $\Veim{lyr} \neq \Veim{lb}$; and
\item
an \xdfn{outer}{outer (layer of a Leo silo)}
layer of \var{lsl} if
\Veim{lyr} is not an inner
layer of \var{lsl}.
\end{itemize}
\end{definition}

\begin{theorem}
\label{t:catena-determines-leo-top}
Given a specific choice of location,
every element of a Leo catena has the same
memoized Leo top item,
and the same completed Leo top item.
\end{theorem}

\begin{proof}
Let \var{cat} be a catena.
Every element of \var{cat} has the same origin and dotted rule
\tref{t:catena-top-elements-identical}.
This means they have the same memoized Leo top
\dref[memoized Leo top]{def:leo-silo}.
Since every element of \var{cat} has the same memoized Leo top,
every element of \var{cat} has the same completed Leo top
\tref{t:memoized-top-to-completed-top}.
\end{proof}

\begin{lemma}
\label{lem:leo-memo-of-incomplete-eim}
Let \Veim{cuz} be a valid EIM which is quasi-complete,
but incomplete.
Then
there is a valid \Veim{eff} such that
\Veim{eff}
is the unique silo effect of
\Veim{cuz}.
\end{lemma}

\begin{proof}
Since, by assumption for the theorem,
\Veim{cuz} is incomplete, it has a postdot symbol.
Since, by assumption for the theorem,
\Veim{cuz} is quasi-complete, the postdot symbol must be nulling.
\Veim{cuz} is therefore the top-down cause of a null-scan,
so that,
by Theorem \ref{t:null-scan-from-down-cause},
there is a valid \Veim{eff} such that
\begin{equation}
\label{eq:lem-leo-memo-of-incomplete-eim-9}
\text{\Veim{eff}
is the unique effect
of \Veim{cuz},}
\end{equation}
and \Veim{eff} is such that
\begin{equation}
\label{eq:lem-leo-memo-of-incomplete-eim-10a}
\Right{\Veim{cuz}} = \Right{\Veim{eff}}
\end{equation}

\Veim{cuz} is quasi-complete by assumption for the theorem,
so that from
\eqref{eq:lem-leo-memo-of-incomplete-eim-10a}
we know that
\begin{equation}
\label{eq:lem-leo-memo-of-incomplete-eim-11}
\text{\Veim{eff} is quasi-complete}.
\end{equation}
From
\eqref{eq:lem-leo-memo-of-incomplete-eim-9},
\eqref{eq:lem-leo-memo-of-incomplete-eim-10a},
and \eqref{eq:lem-leo-memo-of-incomplete-eim-11},
we see that
\Veim{eff}
is the unique silo effect
of \Veim{cuz}.
\end{proof}

\begin{theorem}
\ttitle{Leo silo uniqueness}
\label{t:leo-silo-uniqueness}
Let \Vleo{leo} be an instantiated Leo memo;
and let \Veim{lb} be a valid EIM that matches
\Vleo{leo}.
Then there is exactly one fleeting Leo silo
with \Veim{lb} as its bottom layer.
\end{theorem}

\begin{proof}
We assume, for a reductio and without loss of generality,
that \var{lsl1} and \var{lsl2} are two distinct Leo silos
such that
\begin{equation}
\label{eq:leo-silo-uniqueness-10}
\el{lsl1}{0} = \Veim{lb} = \el{lsl2}{0}.
\end{equation}

If \var{lsl1} and \var{lsl2} are distinct,
then
\begin{equation}
\label{eq:leo-silo-uniqueness-12}
\exists \; \var{ix} : \Vel{lsl1}{ix} \neq \Vel{lsl2}{ix}.
\end{equation}
Let \var{ix1} be the first index in which \var{lsl1}
and \var{lsl2} differ, so that
\begin{equation}
\label{eq:leo-silo-uniqueness-15}
\Vel{lsl1}{ix1} \neq \Vel{lsl2}{ix1} \; \land \; (\forall \; \var{a} : 0 \le \var{a} < \var{ix1} \implies
\Vel{lsl1}{a} = \Vel{lsl2}{a}).
\end{equation}
From \eqref{eq:leo-silo-uniqueness-10}
we know that $\var{ix1} > 0$.

TODO: finish.
\end{proof}

\section{Reconstructing Leo silos}

\begin{algorithm}[tb]
\algtitle{Reconstruct memoized EIM's}{alg:reconstruct-memoized-eims}
\begin{algorithmic}[1]
\Procedure{Reconstruct}{\Veim{lb}}
\Statex \Veim{lb} is required to be valid, complete,
  and to have an instantiated matching Leo memo
\label{line:reconstruct-memoized-eims-preloop-5}
\State $\Veim{up} \gets \Veim{lb}$
\label{line:reconstruct-memoized-eims-preloop-10}
\State $\Vleo{memo} \gets$ the matching Leo memo of \Veim{lb}
\label{line:reconstruct-memoized-eims-preloop-20}
\While{ $\Vleo{memo} \neq \undefined$ and \Vleo{memo} is instantiated }
\label{line:reconstruct-memoized-eims-loop-first}
\Statex
\Comment This line is also referred to as \var{top}
\State \Veim{down} $\gets$ basis of \Vleo{memo}
\label{line:reconstruct-memoized-eims-loop-20}
\State \Veim{lasting} $\gets$ effect of \Veim{down}, \Veim{up}
\label{line:reconstruct-memoized-eims-loop-23}
\Statex
\Comment On lines \ref{line:reconstruct-memoized-eims-loop-20}--%
\ref{line:reconstruct-memoized-eims-loop-23}, %
  see Theorem \ref{t:leo-effect}
\State \var{mfc} $\gets$ maximal fleeting closure of \Veim{lasting}
\label{line:reconstruct-memoized-eims-loop-39}
\For{$\Veim{new} \in \var{mfc}$}
\If{\Veim{new} is not already in the Earley tables}
\State Add \Veim{new} to the Earley tables
\label{line:reconstruct-memoized-eims-loop-41}
\EndIf
\EndFor
\State $\Veim{up} \gets \el{mfc}{\Vlastix{mfc}}$
\label{line:reconstruct-memoized-eims-loop-43}
\Statex
\Comment \el{mfc}{\Vlastix{mfc}} is the completion of \var{mfc}
\State \Vleo{memo} $\gets$ top-down cause of \Vleo{memo}
\label{line:reconstruct-memoized-eims-loop-46}
\EndWhile
\label{line:reconstruct-memoized-eims-loop-last}
% \label{line:reconstruct-memoized-eims-90}
\EndProcedure
\end{algorithmic}
\end{algorithm}

This section presents
Algorithm \ref{alg:reconstruct-memoized-eims},
along with several theorems whose proofs
require it.
In this section,
we will call the loop in
lines
\ref{line:reconstruct-memoized-eims-loop-first}--%
\ref{line:reconstruct-memoized-eims-loop-last}
of Algorithm \ref{alg:reconstruct-memoized-eims},
the ``main loop''.
By the ``top of the main loop'' we will mean
the point
just after the execution of
line \ref{line:reconstruct-memoized-eims-loop-first}.
We will often refer to
line \ref{line:reconstruct-memoized-eims-loop-first}
as a variable name: \var{top}.

We will write \vat{\var{v}}{\var{n}} for the value
of \var{v} just after the execution of line \var{n}
of Algorithm \ref{alg:reconstruct-memoized-eims}.
We will write \vatp{\var{v}}{\var{n}}{\var{p}} for the value
of \var{v} just after the execution of line \var{n}
of Algorithm \ref{alg:reconstruct-memoized-eims}
on the \var{p}'th pass through the main loop.

EIM's are added
by Algorithm \ref{alg:reconstruct-memoized-eims}
only at line
\ref{line:reconstruct-memoized-eims-loop-41},
and every EIM added 
at line \ref{line:reconstruct-memoized-eims-loop-41},
is contained in
\vatp{\var{mfc}}{\ref{line:reconstruct-memoized-eims-loop-39}}{\var{p}}
for some \var{p}.
If $\Veim{eim} \in 
\vatp{\var{mfc}}{\ref{line:reconstruct-memoized-eims-loop-39}}{\var{p}}$,
we say that 
\Veim{eim} is ``potentially added''
by Algorithm \ref{alg:reconstruct-memoized-eims}
in pass \var{p}.
An EIM potentially added in pass \var{p} will actually be
added only if it is not a duplicate of an EIM already
in the Earley tables.

We first show that 
Algorithm \ref{alg:reconstruct-memoized-eims}
is well-formed.
In this context, ``well-formed'' means that all variables
are either well-defined, or have their undefinedness
provided for in the algorithm.

\begin{theorem}
\ttitle{Leo reconstruction well-formedness}
\label{t:leo-reconstruction-wellformedness}
Let Algorithm \ref{alg:reconstruct-memoized-eims}
be called as
\call{Reconstruct}{\Veim{lb}},
where \mycallname{Reconstruct} is as specified in
Algorithm \ref{alg:reconstruct-memoized-eims},
\Vleo{leo} is an instantiated Leo memo,
and \Veim{lb} is a valid EIM that matches
\Vleo{leo}.
Then
\begin{gather*}
\text{Algorithm \ref{alg:reconstruct-memoized-eims}
is well-formed;
}
\end{gather*}
and, where \var{x} is a pass through the main loop,
\begin{equation}
\label{t:leo-reconstruction-wellformedness-10}
\tag{IND}
\begin{gathered}
\text{
\vatp{\Veim{up}}{\var{top}}{\var{x}}
is valid and complete;
}
\\
\text{
\vatp{\Vleo{memo}}{\var{top}}{\var{x}}
is instantiated; and
}
\\
\text{
\Memo{\vatp{\Veim{up}}{\var{top}}{\var{x}}}
= \vatp{\Vleo{memo}}{\var{top}}{\var{x}}
}
\end{gathered}
\end{equation}
\end{theorem}

\begin{proof}
We proceed by induction
on the number of passes through the main loop.
For the induction hypothesis, we use
\eqref{t:leo-reconstruction-wellformedness-10}.
We also use
\eqref{t:leo-reconstruction-wellformedness-10}
as a loop invariant
as described in
\cite{ED1976},
where the loop invariant, or ``guard'', is required to be true after the test at the top
of a loop.
In our case,
\eqref{t:leo-reconstruction-wellformedness-10}
is required to be true at the top of the main loop.

By assumption for the theorem,
\vat{\Veim{lb}}{\ref{line:reconstruct-memoized-eims-preloop-5}}
is valid and complete and has a matching Leo memo,
which is instantiated.
From this we conclude that
\vat{\Veim{up}}{\ref{line:reconstruct-memoized-eims-preloop-10}}
and
\vat{\Vleo{memo}}{\ref{line:reconstruct-memoized-eims-preloop-20}}
are well-defined
and that
\eqref{t:leo-reconstruction-wellformedness-10}
is true for $\var{x} = 0$.
We take this as the basis of our induction.

For the step of the induction, we assume that
\eqref{t:leo-reconstruction-wellformedness-10} is true
for $\var{x} = \var{i}$,
to show that
\eqref{t:leo-reconstruction-wellformedness-10} is true
for $\var{x} = \Vincr{i}$.
By assumption for the step,
\vatp{\Veim{up}}{\var{top}}{\var{i}}
is valid and complete and matches
\vatp{\Vleo{memo}}{\var{top}}{\var{i}},
which is instantiated.
The effect of
\vatp{\Veim{up}}{\var{top}}{\var{i}}
and
\vatp{\Vleo{memo}}{\var{top}}{\var{i}}
is assigned to
\vatp{\Veim{lasting}}{\ref{line:reconstruct-memoized-eims-loop-23}}{\var{i}}.
We know from
Theorem \ref{t:leo-effect} that
\begin{align}
\label{t:leo-reconstruction-wellformedness-34}
& \myparbox{
\vatp{\Veim{lasting}}{\ref{line:reconstruct-memoized-eims-loop-23}}{\var{i}}
is valid and the silo effect of
\vatp{\Veim{up}}{\var{top}}{\var{i}}
$\because$
\eqref{eq:def-leo-effect-10},
\eqref{eq:def-leo-effect-10a};
}
\\
\label{t:leo-reconstruction-wellformedness-35}
& \myparbox{if
\vatp{\Vleo{memo}}{\var{top}}{\var{i}}
has an instantiated top-down cause, then
\Memo{\vatp{\Veim{lasting}}{\ref{line:reconstruct-memoized-eims-loop-23}}{\var{i}}}
is the top-down cause of
\vatp{\Vleo{memo}}{\var{top}}{\var{i}}
$\because$
\eqref{eq:def-leo-effect-15};
}
\\
\notag
& \myparbox{
\vatp{\Vleo{memo}}{\ref{line:reconstruct-memoized-eims-loop-46}}{\var{i}}
is well-formed
$\because$
\eqref{t:leo-reconstruction-wellformedness-35};
}
\end{align}

We have shown that the assignments as far as
line \ref{line:reconstruct-memoized-eims-loop-23}
of Algorithm \ref{alg:reconstruct-memoized-eims}
are well-defined, and therefore that they are well-formed.
We will now show that the remaining assignments are well-formed.
By Theorem
\ref{t:maximal-fleeting-closure-validity}
\vatp{\Veim{lasting}}{\ref{line:reconstruct-memoized-eims-loop-23}}{\var{i}}
is in exactly one maximal fleeting closure,
so that
\vatp{\var{mfc}}{\ref{line:reconstruct-memoized-eims-loop-39}}{\var{i}}
is well-defined.
Every fleeting closure contains at least that EIM which is its base,
and a maximal fleeting closure, by its definition,
must contain its own lasting base.
Therefore
the maximal fleeting closure
\vatp{\var{mfc}}{\ref{line:reconstruct-memoized-eims-loop-39}}{\var{i}}
contains at least one element,
so that
\vatp{\Veim{up}}{\ref{line:reconstruct-memoized-eims-loop-43}}{\var{i}}
is well-defined.

Finally, for line \ref{line:reconstruct-memoized-eims-loop-46},
we consider
\vatp{\Vleo{memo}}{\ref{line:reconstruct-memoized-eims-loop-46}}{\var{i}}
to be well-formed,
even if it is undefined.
Line \ref{line:reconstruct-memoized-eims-loop-first} filters out
the undefined values of \Vleo{memo}.

By
\eqref{t:leo-reconstruction-wellformedness-34},
\vatp{\Veim{lasting}}{\ref{line:reconstruct-memoized-eims-loop-23}}{\var{i}}
is a silo effect
and therefore, by the definition of a silo,
\vatp{\Veim{lasting}}{\ref{line:reconstruct-memoized-eims-loop-23}}{\var{i}}
is quasi-complete.
Since
\vatp{\Veim{lasting}}{\ref{line:reconstruct-memoized-eims-loop-23}}{\var{i}}
is quasi-complete,
by Theorem
\ref{t:maximal-fleeting-closure-silo},
\vatp{\var{mfc}}{\ref{line:reconstruct-memoized-eims-loop-39}}{\var{i}}
is a fleeting closure silo.
By the properties of a fleeting closure silo,
we know that all of its layers are valid
and that its last layer is a complete EIM,
so that
\begin{align}
\label{t:leo-reconstruction-wellformedness-39}
& \myparbox{
\vatp{\Veim{up}}{\ref{line:reconstruct-memoized-eims-loop-43}}{\var{i}}
is valid and complete.
}
\\
\label{t:leo-reconstruction-wellformedness-40b}
& \myparbox{
Let \Vleo{next} be
the top-down cause of
\vatp{\Vleo{memo}}{\var{top}}{\var{i}}.
Note that \Vleo{next} may be undefined
or uninstantiated.
Then
}
\\
\label{t:leo-reconstruction-wellformedness-40d}
& \myparbox{
$\Memo{\vatp{\Veim{lasting}}{\ref{line:reconstruct-memoized-eims-loop-23}}{\var{i}}}
=
\Vleo{next}
\because$
\eqref{t:leo-reconstruction-wellformedness-35},
\eqref{t:leo-reconstruction-wellformedness-40b};
}
\\
\label{t:leo-reconstruction-wellformedness-40e}
& \myparbox{
$\vatp{\Veim{lasting}}{\ref{line:reconstruct-memoized-eims-loop-23}}{\var{i}}
\in
\vatp{\var{mfc}}{\ref{line:reconstruct-memoized-eims-loop-39}}{\var{i}}
\because$
Def of fleeting closure,
  line \ref{line:reconstruct-memoized-eims-loop-39};
}
\\
\label{t:leo-reconstruction-wellformedness-40g}
& \myparbox{
$\vatp{\Veim{up}}{\ref{line:reconstruct-memoized-eims-loop-43}}{\var{i}}
\in
\vatp{\var{mfc}}{\ref{line:reconstruct-memoized-eims-loop-39}}{\var{i}}
\because$
line \ref{line:reconstruct-memoized-eims-loop-43};
}
\\
\label{t:leo-reconstruction-wellformedness-40i}
& \myparbox{
$\Memo{\vatp{\Veim{up}}{\ref{line:reconstruct-memoized-eims-loop-43}}{\var{i}}}
= \Vleo{next} \because$
Theorem \ref{t:leo-memo-fleeting closure},
\eqref{t:leo-reconstruction-wellformedness-40d},
\eqref{t:leo-reconstruction-wellformedness-40e},
\eqref{t:leo-reconstruction-wellformedness-40g};
}
\\
\label{t:leo-reconstruction-wellformedness-40k}
& \myparbox{
$\vatp{\Vleo{memo}}{\ref{line:reconstruct-memoized-eims-loop-46}}{\var{i}}
= \Vleo{next}
\because$
\eqref{t:leo-reconstruction-wellformedness-40b},
line \ref{line:reconstruct-memoized-eims-loop-46};
}
\\
\label{t:leo-reconstruction-wellformedness-40m}
& \myparbox{\vatp{\Vleo{memo}}{\var{top}}{\Vincr{i}} is instantiated
$\because$
line \ref{line:reconstruct-memoized-eims-loop-first};
}
\\
\label{t:leo-reconstruction-wellformedness-40o}
& \vatp{\Vleo{memo}}{\ref{line:reconstruct-memoized-eims-loop-46}}{\var{i}}
= \vatp{\Vleo{memo}}{\var{top}}{\Vincr{i}}
\because \text{Algorithm \ref{alg:reconstruct-memoized-eims}}
\\
\label{t:leo-reconstruction-wellformedness-40q}
& \vatp{\Veim{up}}{\ref{line:reconstruct-memoized-eims-loop-43}}{\var{i}}
= \vatp{\Veim{up}}{\var{top}}{\Vincr{i}}
\because \text{Algorithm \ref{alg:reconstruct-memoized-eims}};
\\
\label{t:leo-reconstruction-wellformedness-40s}
& \myparbox{
\vatp{\Veim{up}}{\var{top}}{\Vincr{i}}
is valid and complete
$\because$
\eqref{t:leo-reconstruction-wellformedness-39},
\eqref{t:leo-reconstruction-wellformedness-40q};
}
\\
\label{t:leo-reconstruction-wellformedness-40u}
& \myparbox{
$\Memo{\vatp{\Veim{up}}{\var{top}}{\Vincr{i}}}
= \vatp{\Vleo{memo}}{\var{top}}{\Vincr{i}}
\because$
\eqref{t:leo-reconstruction-wellformedness-40i},
\eqref{t:leo-reconstruction-wellformedness-40k},
\eqref{t:leo-reconstruction-wellformedness-40o}.
}
\end{align}

\eqref{t:leo-reconstruction-wellformedness-40m},
\eqref{t:leo-reconstruction-wellformedness-40s},
and
\eqref{t:leo-reconstruction-wellformedness-40u}
are
\eqref{t:leo-reconstruction-wellformedness-10}
for $\var{x} = \Vincr{i}$,
and therefore the step of the induction.
With this we have the induction and the theorem.
\end{proof}

\begin{lemma}
\label{lem:reconstruction-effect}
In Algorithm \ref{alg:reconstruct-memoized-eims},
for every pass \var{p},
\vatp{\Veim{lasting}}{\ref{line:reconstruct-memoized-eims-loop-23}}{\var{p}}
is the Leo effect of
\vatp{\Vleo{memo}}{\var{top}}{\var{p}}
and
\vatp{\Veim{up}}{\var{top}}{\var{p}}.
\end{lemma}

\begin{proof}
From
Theorem \ref{t:leo-reconstruction-wellformedness},
we know that
\begin{equation}
\label{lem:reconstruction-effect-10}
\begin{gathered}
\text{
\vatp{\Veim{up}}{\var{top}}{\var{p}}
is valid and complete;
}
\\
\text{
\vatp{\Vleo{memo}}{\var{top}}{\var{p}}
is instantiated; and
}
\\
\Memo{\vatp{\Veim{up}}{\var{top}}{\var{p}}}
= \vatp{\Vleo{memo}}{\var{top}}{\var{p}}.
\end{gathered}
\end{equation}
From
\eqref{lem:reconstruction-effect-10},
Theorem \ref{t:leo-effect}
and
lines \ref{line:reconstruct-memoized-eims-loop-20}--%
\ref{line:reconstruct-memoized-eims-loop-23} of
Algorithm \ref{alg:reconstruct-memoized-eims},
we see that
\vatp{\Veim{lasting}}{\ref{line:reconstruct-memoized-eims-loop-23}}{\var{p}}
is the Leo effect
of
\vatp{\Vleo{memo}}{\var{top}}{\var{p}}
and
\vatp{\Veim{up}}{\var{top}}{\var{p}}.
\end{proof}

\begin{theorem}
\ttitle{Leo reconstruction termination}
\label{t:leo-reconstruction-termination}
Let \mycallname{Reconstruct} be as specified in
Algorithm \ref{alg:reconstruct-memoized-eims},
let \Vleo{leo} be an instantiated Leo memo,
and let \Veim{lb} be a valid EIM that matches
\Vleo{leo}.
Then
\begin{align}
\label{eq:leo-reconstruction-termination-10b}
& \myparbox{\Veim{lb} has a catena, call it \var{cat},
and the length of \var{cat} is the same as
the number of complete EIM's potentially added by
\call{Reconstruct}{\Veim{lb}}, and
}
\\
\label{eq:leo-reconstruction-termination-10d}
& \myparbox{\call{Reconstruct}{\Veim{lb}} terminates.}
\end{align}
\end{theorem}

\begin{proof}
Let \var{seq} be a sequence such that
\begin{equation}
\Vel{seq}{i} =
\begin{cases}
\text{\vat{\Vleo{memo}}{\ref{line:reconstruct-memoized-eims-preloop-20}},
if \var{i} = 0}
\\
\text{the top-down cause of \el{seq}{\Vdecr{i}}, otherwise}.
\end{cases}
\end{equation}
By the definition of catena, \var{seq} is a catena,
and by the definition of the catena of an EIM,
\var{seq} is the catena of \Veim{lb}.

Call a pass through the main loop, \var{p}.
In Algorithm \ref{alg:reconstruct-memoized-eims},
we see that pass \var{p}
potentially adds the contents of the fleeting closure
of 
\vatp{\Veim{lasting}}{\ref{line:reconstruct-memoized-eims-loop-23}}{\var{p}}
to the Earley sets.
From Theorems \ref{t:leo-reconstruction-wellformedness}
and \ref{t:leo-effect},
we know that 
\vatp{\Veim{lasting}}{\ref{line:reconstruct-memoized-eims-loop-23}}{\var{p}}
is a silo effect, and therefore that
\vatp{\Veim{lasting}}{\ref{line:reconstruct-memoized-eims-loop-23}}{\var{p}}
is quasi-complete.
The fleeting closure
of \vatp{\Veim{lasting}}{\ref{line:reconstruct-memoized-eims-loop-23}}{\var{p}},
which is \vatp{\var{mfc}}{\ref{line:reconstruct-memoized-eims-loop-39}}{\var{p}},
is therefore a quasi-complete fleeting closure.
By Theorem
\ref{t:quasi-complete-fleeting-closure-properties}
we know that
\vatp{\var{mfc}}{\ref{line:reconstruct-memoized-eims-loop-39}}{\var{p}}
contains exactly one complete EIM.
Therefore
\begin{equation}
\label{eq:leo-reconstruction-termination-30}
\myparbox{each pass through the main loop
  potentially adds exactly one complete EIM.
}
\end{equation}

From Theorem \ref{t:leo-reconstruction-wellformedness},
and lines
\ref{line:reconstruct-memoized-eims-loop-46}
and
\ref{line:reconstruct-memoized-eims-loop-first}
of
Algorithm \ref{alg:reconstruct-memoized-eims},
we see that, in every pass through the main loop except
the last,
the main loop follows a new link of the catena of \Veim{lb}.
There is also a catena link initially associated with \Veim{lb},
\vat{\Vleo{leo}}{\ref{line:reconstruct-memoized-eims-preloop-5}},
so that
\begin{equation}
\label{eq:leo-reconstruction-termination-32}
\myparbox{the catena of \Veim{lb} has exactly one link
  for every pass through the main loop.
}
\end{equation}

From
\eqref{eq:leo-reconstruction-termination-30}
and \eqref{eq:leo-reconstruction-termination-32},
we see that
there is a link in the catena of \Veim{lb} for every
complete EIM potentially added by
the main loop.
This shows
\eqref{eq:leo-reconstruction-termination-10b}
of the requirements of this theorem.

By the definition of a catena, \var{seq} is a catena.
But, by Theorem
\ref{t:leo-catenas-are-finite}, a Leo catena must be finite.
So there must be an upper bound on \var{p}.
Therefore Algorithm \ref{alg:reconstruct-memoized-eims}
makes \var{p} or fewer passes through the main loop.
Therefore Algorithm \ref{alg:reconstruct-memoized-eims}
must terminate before the \Vincr{p}'th pass through
the main loop.
This shows
\eqref{eq:leo-reconstruction-termination-10d}
of the requirements of this theorem.
\end{proof}

Recall that
EIM's are potentially added
if and only if they are contained in
\vatp{\var{mfc}}{\ref{line:reconstruct-memoized-eims-loop-39}}{\var{p}}
for some \var{p},
where \var{p} is a pass through the main loop.
Recall that we write
$\var{s1} + \var{s2}$,
for the concatenation of the series \var{s2} after the series
\var{s1}.
For the rest of this section,
let \var{sqsq}%
\index{recce-notation}{sqsq@\var{sqsq}!(\Vel{sqsq}{sqix})[\var{ix}]}
be a sequence of sequences of EIM's,
such that
\begin{equation}
\label{eq:def-sqsq}
\Vel{sqsq}{x} =
\begin{cases}
[ \lbrace \Veim{lb} \rbrace ],
& \text{if $\var{x} = 0$}
\\
[ \el{sqsq}{\Vdecr{x}} +
\vatp{\var{mfc}}{\ref{line:reconstruct-memoized-eims-loop-39}}{\Vdecr{x}}
],
& \text{if $\var{x} \ge 1$}
\end{cases}
\end{equation}

\begin{theorem}
\ttitle{Leo reconstruction layer validity}
\label{leo-reconstruction-layer-validity}
Let \mycallname{Reconstruct} be as specified in
Algorithm \ref{alg:reconstruct-memoized-eims};
let \Vleo{leo} be an instantiated Leo memo;
let \Veim{lb} be a valid EIM that matches
\Vleo{leo};
and let \var{slo} be the set containing
\Veim{lb} and every EIM potentially added to the Earley tables
by 
the call
\call{Reconstruct}{\Veim{lb}}.
Then every element of \var{slo} is valid.
\end{theorem}

\begin{proof}
We proceed by induction
on the number of passes through the main loop.
Our induction hypothesis is
\begin{equation}
\label{eq:leo-reconstruction-layer-validity-IND}
\tag{IND}
\forall \; \var{a} : 0 \le \var{a} \le \Vlastix{(\Vel{sqsq}{x})}
  \implies \Valid{(\Vel{sqsq}{x})[\var{a}]}.
\end{equation}

We take $\var{x} = 0$
as the basis of our induction.
From \eqref{eq:def-sqsq},
we see that
\begin{equation}
\label{t:leo-reconstruction-layer-validity-17}
\el{sqsq}{0} = [ \Veim{lb} ],
\end{equation}
where \el{sqsq}{0} satisfies
\eqref{eq:leo-reconstruction-layer-validity-IND} by assumption
for the theorem.

For the step of the induction, we assume that
\eqref{eq:leo-reconstruction-layer-validity-IND}
is true for $\var{x} = \var{i}$,
to show that
\eqref{eq:leo-reconstruction-layer-validity-IND}
is true for $\var{x} = \Vincr{i}$.
From
Lemma \ref{lem:reconstruction-effect}
and 
\eqref{eq:def-leo-effect-10}
of the definition of Leo effect
we know that,
if there is a pass \Vincr{i},
\begin{equation}
\label{t:leo-reconstruction-layer-validity-22a}
\myparbox{\vatp{\Veim{lasting}}{\ref{line:reconstruct-memoized-eims-loop-23}}{\Vincr{i}}
is valid.
}
\end{equation}
By assumption for the step,
\begin{equation}
\label{t:leo-reconstruction-layer-validity-24}
\forall \; \var{a} : 0 \le \var{a} \le \Vlastix{(\Vel{sqsq}{i})} \implies \Valid{(\Vel{sqsq}{i})[\var{a}]}.
\end{equation}
Let
\[
\var{next-mfc} = \vatp{\var{mfc}}{\ref{line:reconstruct-memoized-eims-loop-39}}{\Vincr{i}}
\]
From line \ref{line:reconstruct-memoized-eims-loop-39},
we know that \var{next-mfc}
is the fleeting closure of
\begin{equation}
\label{t:leo-reconstruction-layer-validity-25}
\vatp{\Veim{lasting}}{\ref{line:reconstruct-memoized-eims-loop-23}}{\Vincr{i}}.
\end{equation}
From
\eqref{t:leo-reconstruction-layer-validity-22a},
\eqref{t:leo-reconstruction-layer-validity-25}
and
Theorem \ref{t:partial-fleeting-closure-validity},
we know
that
\begin{equation}
\label{t:leo-reconstruction-layer-validity-26}
\forall \; \var{a} : 0 \le \var{a} \le \Vlastix{next-mfc} \implies \Valid{\Vel{next-mfc}{a}}.
\end{equation}
It will always be the case that $\Vincr{i} \ge 1$,
so that
\eqref{eq:leo-reconstruction-layer-validity-IND} for the step follows
from
\eqref{eq:def-sqsq},
\eqref{t:leo-reconstruction-layer-validity-24}
and \eqref{t:leo-reconstruction-layer-validity-26}.
This shows the step of the induction, the induction
and the theorem.
\end{proof}

\begin{theorem}
\ttitle{Leo reconstruction silo effects}
\label{t:leo-reconstruction-silo-effects}
TODO: probably delete this.
Let \mycallname{Reconstruct} be as specified in
Algorithm \ref{alg:reconstruct-memoized-eims};
let \Vleo{leo} be an instantiated Leo memo;
let \Veim{lb} be a valid EIM that matches
\Vleo{leo};
and let \var{slo} be the set containing
\Veim{lb} and every EIM potentially added to the Earley tables
by 
the call
\call{Reconstruct}{\Veim{lb}}.
Then
\begin{align}
\label{eq:leo-reconstruction-silo-effects-5d}
& \el{slo}{0} = \Veim{lb}
\\
\label{eq:leo-reconstruction-silo-effects-5f}
& \begin{aligned}
& \forall \; \var{a} : 1 \le \var{a} \le \Vlastix{slo}
\\
& \qquad \implies
\text{\Vel{slo}{\var{a}} is the unique silo effect of \el{slo}{\Vdecr{a}}}
\end{aligned}
\end{align}
\end{theorem}

\begin{proof}
TODO: delete this.
\end{proof}

TODO: to here

\begin{definition}
\dtitle{Matching catena of Leo silo}
TODO: Do I need this?
\end{definition}

\begin{theorem}
\ttitle{Leo silo right recursion}
\label{t:leo-silo-rr}
Every layer of a Leo silo, except the bottom layer, is right-recursive.
\end{theorem}

\begin{proof}
TODO: redo.
\end{proof}

\begin{theorem}
\ttitle{Leo silos with common lower layers}
\label{leo-silo-common-lower-layers}
If a lower layer occurs in two Leo silos,
then both silos have the same top element.
\end{theorem}

\begin{proof}
Let \var{aslo} and \var{bslo} be two Leo silos
that share a common EIM, call it \var{ceim}.
From Theorem
\ref{t:silo-location},
and by the definition of silo location,
we know that a silo shares
its location
with every EIM in the silo, so that
both silos have the same location:
\begin{equation}
\label{leo-silo-common-lower-layers-15}
    \Current{\Veim{ceim}} = \Right{\Veim{aslo}} = \Right{\Veim{bslo}}.
\end{equation}

By Theorem
\ref{t:leo-silo-catena}
there is a catena \var{acat}
that contains
all the matching Leo memos
of the layers of \var{aslo},
and
there is a catena \var{bcat}
that contains
all the matching Leo memos
of the layers of \var{bslo}:
\begin{multline}
\label{leo-silo-common-lower-layers-21}
\forall \; \var{i} \; \exists \; \Vleo{l}, \Veim{eim}
: 0 \le \var{i} < \Vlastix{aslo} \\
\implies
\Veim{eim} = \Vel{aslo}{i}
\; \land \; \Vleo{l} = \Memo{\Veim{eim}}
\; \land \; \Vleo{l} \in \var{acat} \\
\shoveleft{
  \text{and} \quad
  \forall \; \var{i} \; \exists \; \Vleo{l}, \Veim{eim}
  : 0 \le \var{i} < \Vlastix{bslo}
} \\
\implies
\Veim{eim} = \Vel{bslo}{i}
\; \land \; \Vleo{l} = \Memo{\Veim{eim}}
\; \land \; \Vleo{l} \in \var{bcat}
\end{multline}
Let \Vleo{cleo} be the Leo memo that matches \Veim{ceim}.
From
\eqref{leo-silo-common-lower-layers-21} we have
\begin{equation}
\label{leo-silo-common-lower-layers-28}
\Vleo{cleo} \in \var{acat}
\; \land \;
\Vleo{cleo} \in \var{bcat}.
\end{equation}

By Theorem
\ref{t:catena-top-elements-identical}, all catena elements contain
the same dotted rule and origin.
Since by
\eqref{leo-silo-common-lower-layers-28},
\var{acat} and \var{bcat} share the element \Vleo{cleo},
we know that
\begin{multline}
\label{leo-silo-common-lower-layers-31}
\forall \; \Vleo{l1}, \Vleo{l2} : \\
\Vleo{l1} \in (\var{acat} \cup \var{bcat})
\; \land \;
\Vleo{l2} \in (\var{acat} \cup \var{bcat}) \\
\implies
\left(
\begin{gathered}
\DR{\Vleo{l1}} = \DR{\Vleo{l2}} \\
\land \quad \Left{\Vleo{l1}} = \Left{\Vleo{l2}}
\end{gathered}
\right)
\end{multline}

TODO: Fix the rest of this proof for Leo-top.

From
\eqref{leo-silo-common-lower-layers-31}
and the definition of a Leo top layer,
\begin{multline}
\label{leo-silo-common-lower-layers-34}
\forall \; \Vloc{curr}, \Vleo{l1}, \Vleo{l2} : \\
\Vleo{l1} \in (\var{acat} \cup \var{bcat})
\; \land \;
\Vleo{l2} \in (\var{acat} \cup \var{bcat}) \\
\implies
\op{Leo-top}{\Vleo{l1}, \Vloc{curr}}
= \op{Leo-top}{\Vleo{l2}, \Vloc{curr}}.
\end{multline}

Combining
\eqref{leo-silo-common-lower-layers-21}
with
\eqref{leo-silo-common-lower-layers-34},
we have
\begin{multline}
\label{leo-silo-common-lower-layers-37}
\forall \; \Veim{eim1}, \Veim{eim2} \;
\exists \; \Vleo{l1}, \Vleo{l2} : \\
\Veim{eim1} \in (\var{aslo} \cup \var{bslo})
\; \land \;
\Veim{eim2} \in (\var{aslo} \cup \var{bslo}) \\
\implies
\Vleo{l1} = \Memo{\Veim{eim1}}
\; \land \; \Vleo{l2} = \Memo{\Veim{eim2}}
\\
\; \land \;
\op{Leo-top}{\Vleo{l1}, \Vloc{curr}}
= \op{Leo-top}{\Vleo{l2}, \Vloc{curr}}
\end{multline}
In
\eqref{leo-silo-common-lower-layers-15},
we showed that both silos must have the same location
as their common layer: \Right{\Veim{ceim}}.
Setting \Vloc{curr} in
\eqref{leo-silo-common-lower-layers-37}
to
\Right{\Veim{ceim}}, we have the theorem.
\end{proof}

\begin{theorem}
\ttitle{EIM's in Leo silos}
\label{t:eims-in-leo-silos}
Every EIM in a Leo silo is a null-scan,
a read or
a reduction.
Also, if a read EIM is in a Leo silo,
it must be the bottom of the Leo silo.
\end{theorem}

\begin{proof}
By the definition of a Leo silo,
every EIM in a Leo silo is a silo layer.
From Theorem
\ref{t:silo-read-eim-layer},
we know that, if a read EIM is in
a silo, it is the bottom of the silo.
A Leo silo, by its definition,
is a section of a silo,
so that if a Leo silo
contains a read EIM,
it is the bottom of the Leo silo.
\end{proof}

\begin{theorem}
\ttitle{Leo silo minimum height}
\label{leo-silo-minimum-height}
Every Leo silo contains at least two layers.
\end{theorem}

\begin{proof}
By Theorem
\ref{t:leo-silo-catena},
every Leo silo has a catena consisting
of all of its Leo memos.
By the same theorem,
every Leo silo has a complete EIM
for every element of its catena,
plus a top layer.
Every Leo silo, by definition has a bottom
layer with a matching Leo memo,
so every Leo silo has a catena whose length
is at least 1.
A Leo silo therefore contains at least
one complete EIM corresponding to a
Leo memo catena,
plus the top layer.
\end{proof}

\begin{theorem}
\ttitle{Silo outer layer distinctness}
\label{silo-outer-layer-distinctness}
The top and bottom layer of a Leo silo
are distinct.
\end{theorem}

\begin{proof}
This theorem follows from
Theorems
\ref{leo-silo-minimum-height}
and
\ref{t:silo-layer-unique}.
\end{proof}

\begin{definition}
\dtitle{Maximal Leo silo}
Intuitively, a Leo silo is maximal if no other Leo silo
properly contains it.
More formally,
let \var{lsl1} be a Leo silo
and let \var{slo} be a maximal silo which contains it.
We say that
\var{lsl1} is a
\xdfn{maximal Leo silo}{maximal (Leo silo)}%
\index{recce-notation}{Max-Leo-Silo(lslo,slo)@\Vop{Max-Leo-Silo}{lslo,slo}}
with respect to \var{slo}
if and only if one of the following is true:
\begin{itemize}
\item
\el{lsl1}{0} has no silo cause in \var{slo}.
\item
Let \Veim{cuz} be the silo cause of \el{lsl1}{0}.
There is no Leo silo, \var{lsl2}, such that
$\var{lsl1} \subset \var{lsl2} \subseteq \var{slo}$ and
$\Veim{cuz} \in \var{lsl2}$.
\end{itemize}
\end{definition}

\begin{theorem}
\ttitle{Every Leo silo has a maximal Leo silo}
\label{t:maximal-of-leo-silo}
Let \var{maxslo} be a maximal silo,
and let \var{lsl} be a Leo silo contained
in \var{maxslo}.
Then there is a maximal Leo silo with respect to \var{maxslo}
that contains \var{lsl}.
\end{theorem}

\begin{proof}
By the definition of maximal for a Leo silo,
if \var{lsl} is not its own maximal Leo silo with respect
to \var{maxslo},
then \var{lsl} is part of a Leo silo that properly contains \var{lsl}.

Let \var{lsseq} be a sequence
such that $\el{lsseq}{0} = \var{lsl}$
and
\el{lsseq}{\Vincr{i}} is a Leo silo
such that
\[
  \Vel{lsseq}{i} \subset \el{lsseq}{\Vincr{i}} \subseteq \var{maxslo}.
\]
If \Vel{lsseq}{i}
and \el{lsseq}{\Vincr{i}} both exist,
$\Vsize{\el{lsseq}{\Vincr{i}}} > \Vsize{\Vel{lsseq}{i}}$.
By Theorem \ref{t:silo-finite},
the size of any silo is finite,
so that the size of \var{maxslo} is finite.
Therefore, \Vsize{\var{maxslo}}
is a maximum beyond which
the elements of \var{lsseq} cannot grow.
Since every element of \var{lsseq} must be properly larger
than the previous one,
the length of the sequence \var{lsseq} is finite.
So there is a last element of \var{lsseq}.

We now consider the Leo silo \el{lsseq}{\Vlastix{lsseq}}.
\el{lsseq}{\Vlastix{lsseq}}
is not properly contained in any other Leo silo.
And, by the construction of \var{lsseq},
\[
\begin{gathered}
\forall \; \var{i} : \var{lsl} \subseteq \Vel{lsseq}{i} \\
\therefore \quad
\var{lsl} \subseteq \el{lsseq}{\Vlastix{lsseq}}.
\end{gathered}
\]
Therefore, by the definition of a maximal Leo silo,
\el{lsseq}{\Vlastix{lsseq}} is
the maximal Leo silo for \var{lsl} with respect
to \var{maxslo}.
\end{proof}

\begin{theorem}
\ttitle{Leo top maximality}
\label{t:leo-top-maximality}
Let \var{maxslo} be a maximal silo,
and let \var{lsl} be a Leo silo contained
in \var{maxslo}.
The top of a Leo silo
is also the top of its maximal Leo silo with respect
to \var{maxslo}.
\end{theorem}

\begin{proof}
By Theorem
\ref{t:maximal-silo}, there is a \var{maxslo}.
Let \var{maxlsl} be the maximal Leo silo of
\var{lsl} with respect to \var{maxslo}.
By Theorem
\ref{t:maximal-of-leo-silo},
\var{maxlsl} exists and
\begin{equation}
\label{eq:leo-top-maximality-10}
\var{lsl} \subseteq \var{maxlsl}.
\end{equation}
If $\var{lsl} = \var{maxlsl}$, the theorem follows trivially.

It remains to show the theorem in the case that
$\var{lsl} \neq \var{maxlsl}$.
By Theorem
\ref{leo-silo-minimum-height},
the minimum height of \var{lsl} is 2,
and it contains a lower layer, call it \Veim{ll}.
By
\eqref{eq:leo-top-maximality-10},
\var{maxlsl} also contains \Veim{ll}.
Theorem
\ref{leo-silo-common-lower-layers}
tells us that two Leo silos with
a common lower layer have the same top layer,
so that
\[
   \el{lsl}{\Vlastix{lsl}} = \el{maxlsl}{\Vlastix{maxlsl}}.\qedhere
\]
\end{proof}

% \begin{theorem}
% If two Leo silos overlap,
% either
% \begin{itemize}
% \item
% the overlap is only of a single layer,
% which is the top of one and the bottom of the other; or
% \item
% one Leo silo contains the other.
% \end{itemize}
% \end{theorem}
%
% \begin{proof}
% TODO
% \end{proof}

\section{Memoized EIM's}

% \begin{definition}
% \dtitle{Memoable EIM's}
% Let \var{slo} be a silo and
% \Veim{eim} be an EIM.
% \Veim{eim} is said to be
% \dfn{Leo memoable} in \var{slo},
% or more simply,
% \dfn{memoable} in \var{slo},
% if and only if every layer in its fleeting closure
% is an inner layer.
% To say that
% \Veim{eim} is memoable in \var{slo},
% we also write \Memoable{\Veim{eim}}{\var{slo}}%
% \index{recce-notation}{Memoable(eim,slo)@\Memoable{\var{eim}, \var{slo}}}.
% \end{definition}

Intuitively, before memoizing an EIM we want to be sure
of two things: that it can be restored,
and that its memoization does not interfere with
the restoration of any other memoized items.
To do this, we require that it always occur
as an inner layer of
a Leo silo;
and that it not be the top or bottom of a maximal
Leo silo.

\begin{definition}
\dtitle{Memoized EIM's}
Let \Veim{eim} be an EIM
and let \var{mfc} be the maximal fleeting closure
which contains it.
\Veim{eim} is
\xdfn{memoized}{memoized (EIM)}
if and only if
for every maximal silo,
call it \var{maxslo},
we have all
of the following:
\begin{align}
\label{eq:def-memoized-eim-10}
&
\begin{aligned}
& \text{If $\Veim{eim} \in \var{maxslo}$ then} \\
& \qquad \text{there is an \var{lsl} such that} \\
& \qquad \qquad \left(
\begin{gathered}
\Leosilo{\var{lsl}}
\land \; \var{lsl} \subseteq \var{maxslo} \\
\land \; \Veim{eim} \in \var{lsl}.
\end{gathered}
\right)
\end{aligned}
\\
\label{eq:def-memoized-eim-20}
&
\begin{aligned}
& \text{There is no \var{lsl} such that} \\
& \qquad \qquad
\Maxleosilo{\var{lsl}}{\var{maxslo}} \; \land \;
  \el{lsl}{\Vlastix{lsl}} \in \var{mfc}.
\end{aligned}
\\
\label{eq:def-memoized-eim-30}
&
\begin{aligned}
& \text{There is no \var{lsl} such that} \\
& \qquad \qquad
\Maxleosilo{\var{lsl}}{\var{maxslo}} \; \land \;
  \el{lsl}{0} \in \var{mfc}.
\end{aligned}
\end{align}
\end{definition}

Note that
\eqref{eq:def-memoized-eim-10}
requires
that an EIM always occur as a layer of a Leo silo,
but does not include
the intuitive requirement that the EIM be an inner layer.
This is because
\eqref{eq:def-memoized-eim-20}
and
\eqref{eq:def-memoized-eim-30}
do that job adequately.
Also note that
\eqref{eq:def-memoized-eim-20}
and
\eqref{eq:def-memoized-eim-30}
treat all the
EIM's in a fleeting closure as if they are
memoized as a unit.
This makes sense from an implementation point of
view, and it is how Marpa is implemented.

\begin{theorem}
\label{t:leo-quasi-complete}
Only quasi-complete EIM's are
Leo-memoized.
\end{theorem}

\begin{proof}
By the definition of memoized, all memoized EIM's are
silo layers.
All silo layers are,
by the definition of a silo,
quasi-complete.
\end{proof}

\begin{theorem}
\label{t:no-memoized-predictions}
No quasi-prediction is memoized.
\end{theorem}

\begin{proof}
This theorem follows from
Theorem \ref{t:leo-quasi-complete}
and Theorem \ref{t:quasi-drs-disjoint}.
\end{proof}

\begin{theorem}
\label{t:earley-set-0-is-Leo-free}
No EIM in Earley set 0 is memoized.
\end{theorem}

\begin{proof}
By definition,
a quasi-complete EIM has at least one
telluric predot symbol,
so its current location cannot be location 0.
Therefore no quasi-complete EIM occurs in
Earley set 0.
But,
by Theorem \ref{t:leo-quasi-complete},
only quasi-complete EIM's are memoized.
Therefore no EIM in Earley set 0
is memoized.
\end{proof}

\begin{theorem}
\ttitle{Fleeting closure memoization}
\label{t:fleeting-closure-memoization}
Let \Veim{x} and
\Veim{y} be two EIM's in the same
fleeting closure.
Then
\[
\Memoized{\Veim{x}} \equiv \Memoized{\Veim{y}}.
\]
\end{theorem}

\begin{proof}
Since \Veim{x} and \Veim{y} are in the same fleeting
closure,
by Theorem
\ref{t:fleeting-closure-maximization}
they are also in the same maximal fleeting closure.
Call this \var{mfc}, so that
\begin{equation}
\label{eq:lem-fleeting-closure-memoization-13}
\myparbox{$\Veim{x} \in \var{mfc}, \Veim{y} \in \var{mfc}$
and \var{mfc} is the maximal fleeting closure of both
\Veim{x} and
\Veim{y}}
\end{equation}

For the purposes of this proof, we will say that
the Leo silo \var{lsl} is ``potentially maximal'' if
there is some \var{maxslo} such that
\[
\Silo{\var{maxslo}}
\; \land \; \Maximal{\var{maxslo}}
\; \land \; \Maxleosilo{\var{lsl}}{\var{maxslo}}.
\]

\textbf{Case 1}:
We first consider the case where
\var{mfc} contains the top
of a potentially maximal Leo silo.
By the definition of memoized,
\begin{equation}
\label{eq:lem-fleeting-closure-memoization-15}
\neg \Memoized{\Veim{x}} \; \land \; \neg \Memoized{\Veim{y}}.
\end{equation}
From \eqref{eq:lem-fleeting-closure-memoization-15}
we have the theorem for this case.

\textbf{Case 2}:
We next consider the case where
\var{mfc} contains the bottom of a
potentially maximal Leo silo.
Again,
by the definition of memoized,
\begin{equation}
\label{eq:lem-fleeting-closure-memoization-17}
\neg \Memoized{\Veim{x}} \; \land \; \neg \Memoized{\Veim{y}},
\end{equation}
and from \eqref{eq:lem-fleeting-closure-memoization-17}
we have the theorem for this case.

\textbf{Case 3}:
For the theorem,
it remains to consider the case where
\var{mfc} does not contain
either
the top of a maximal Leo silo or
the bottom of a maximal Leo silo.
More formally, there is the case where we have
\begin{equation}
\label{eq:lem-fleeting-closure-memoization-20}
\begin{aligned}
& \text{for all \var{maxslo}, \var{lsl} there is no \Veim{eim} such that} \\
& \qquad
\begin{aligned}
& \Veim{eim} \in \var{mfc} \\
\land \; & \Silo{\var{maxslo}} \; \land \; \Maximal{\var{maxslo}} \\
\land \; & \Maxleosilo{\var{lsl}}{\var{maxslo}} \\
\land \; &
(\Veim{eim} = \el{lsl}{0}
\; \lor \;
\Veim{eim} = \el{lsl}{\Vlastix{lsl}}).
\end{aligned}
\end{aligned}
\end{equation}

\textbf{Outer implication of case 3}:
To show the forward implication for the theorem,
we assume
\begin{equation}
\label{eq:lem-fleeting-closure-memoization-26}
\Memoized{\Veim{x}}
\end{equation}
to show
\begin{equation}
\label{eq:lem-fleeting-closure-memoization-26a}
\Memoized{\Veim{y}}.
\end{equation}
Note that the definitions and assumptions
for \Veim{x} and \Veim{y} are symmetric,
so that our choice to show the forward implication
of the theorem
is without loss of generality.

To show
\Memoized{\Veim{y}},
we must prove that,
for all maximal silos,
we satisfy all three parts of the definition
for $\Veim{eim} \gets \Veim{y}$.
We proceed by assuming,
without loss of generality,
that \var{maxslo} is a maximal silo,
and showing
that we have \eqref{eq:def-memoized-eim-10}
for $\Veim{eim} \gets \Veim{y}$;
\eqref{eq:def-memoized-eim-20}
for $\Veim{eim} \gets \Veim{y}$;
and
\eqref{eq:def-memoized-eim-30}
for $\Veim{eim} \gets \Veim{y}$.

\eqref{eq:lem-fleeting-closure-memoization-20}
shows
\eqref{eq:def-memoized-eim-20}
for $\Veim{eim} \gets \Veim{y}$.
\eqref{eq:lem-fleeting-closure-memoization-20}
shows
\eqref{eq:def-memoized-eim-30}
for $\Veim{eim} \gets \Veim{y}$.
It remains to show
\eqref{eq:def-memoized-eim-10} for $\Veim{eim} \gets \Veim{y}$.

\textbf{Inner implication of case 3}:

\eqref{eq:def-memoized-eim-10}
is an implication.
To show it,
we create an inner implication
by assuming
\begin{equation}
\label{eq:lem-fleeting-closure-memoization-30}
\Veim{y} \in \var{maxslo}
\end{equation}
to show that there is a \var{lsly} such that
\begin{gather}
\label{eq:lem-fleeting-closure-memoization-32}
\Leosilo{\var{lsly}} \\
\label{eq:lem-fleeting-closure-memoization-32a}
\; \land \; \Veim{y} \in \var{lsly} \\
\label{eq:lem-fleeting-closure-memoization-32b}
\; \land \; \var{lsly} \subseteq \var{maxslo}
\end{gather}

From Theorem
\ref{t:maximal-fleeting-silo-in-maximal-silo}
we know that if a maximal silo contains an EIM,
it contains the entire maximal fleeting closure
of that EIM.
Therefore
\begin{align}
\label{eq:lem-fleeting-closure-memoization-32d}
& \var{mfc} \subseteq \var{maxslo}.
&&
\text{Th \ref{t:maximal-fleeting-silo-in-maximal-silo}},
\eqref{eq:lem-fleeting-closure-memoization-30},
\eqref{eq:lem-fleeting-closure-memoization-13}
\\
\label{eq:lem-fleeting-closure-memoization-32d1}
& \Veim{x} \in \var{mfc}
&& \eqref{eq:lem-fleeting-closure-memoization-13}
\\
\label{eq:lem-fleeting-closure-memoization-32e}
& \Veim{x} \in \var{maxslo}
&& \eqref{eq:lem-fleeting-closure-memoization-32d},
\eqref{eq:lem-fleeting-closure-memoization-32d1}
\end{align}
In
\eqref{eq:lem-fleeting-closure-memoization-26},
we assumed $\Memoized{\Veim{x}}$ for the outer
implication.
From this,
the definition of memoized
and \eqref{eq:lem-fleeting-closure-memoization-32e},
we know that
there must exist some \var{lslx} such that
\begin{equation}
\label{eq:lem-fleeting-closure-memoization-36}
\begin{gathered}
\Leosilo{\var{lslx}} \\
\land \; \Veim{x} \in \var{lslx} \\
\land \; \var{lslx} \subseteq \var{maxslo}
\end{gathered}
\end{equation}

From Theorem
\ref{t:maximal-of-leo-silo} we know that every Leo silo
that is contained in \var{maxslo}
is contained in a Leo silo
that is maximal
with respect to \var{maxslo}.
Therefore,
we know that there is a
\var{mlslx} such that
\begin{gather}
\label{eq:lem-fleeting-closure-memoization-40}
\Maxleosilo{\var{mlslx}}{\var{maxslo}} \\
\label{eq:lem-fleeting-closure-memoization-43}
\land \; \Veim{x} \in \var{mlslx} \\
\label{eq:lem-fleeting-closure-memoization-46}
\land \; \var{mlslx} \subseteq \var{maxslo}
\end{gather}

Theorem \ref{t:sequence-overlap} tells us that,
if two subsequences are contained in another sequence,
and the first subsequence does not contain the top or bottom of the
second subsequence,
then either the second subsequence contains all of the first subsequence,
or they are disjoint.
Let our two subsequences be \var{mfc} and \var{mlslx},
and let the sequence that contains them be \var{maxslo}.
At this point we know that
\begin{equation}
\label{eq:lem-fleeting-closure-memoization-49}
\begin{aligned}
& \el{mlslx}{0} \notin \var{mfc}
&& \eqref{eq:lem-fleeting-closure-memoization-20}
\\
& \el{mlslx}{\Vlastix{mlslx}} \notin \var{mfc}
&& \eqref{eq:lem-fleeting-closure-memoization-20}
\\
& \Veim{x} \in \var{mfc}
&& \eqref{eq:lem-fleeting-closure-memoization-13}
\\
& \Veim{y} \in \var{mfc}
&& \eqref{eq:lem-fleeting-closure-memoization-13}
\\
& \var{mlslx} \subseteq \var{maxslo}
&& \eqref{eq:lem-fleeting-closure-memoization-46}
\\
& \var{mfc} \subseteq \var{maxslo}
&& \eqref{eq:lem-fleeting-closure-memoization-32d}
\end{aligned}
\end{equation}
From
\eqref{eq:lem-fleeting-closure-memoization-49}
and Theorem \ref{t:sequence-overlap}
we obtain
\begin{equation}
\label{eq:lem-fleeting-closure-memoization-52}
\Veim{x} \in \var{mlslx} \equiv
\Veim{y} \in \var{mlslx}
\end{equation}
From
\eqref{eq:lem-fleeting-closure-memoization-43}
and \eqref{eq:lem-fleeting-closure-memoization-52},
we have
\begin{equation}
\label{eq:lem-fleeting-closure-memoization-54}
\Veim{y} \in \var{mlslx}.
\end{equation}
We are now in a position to show that we have
a \var{lsly} which satisfies
\eqref{eq:lem-fleeting-closure-memoization-32}.
Let
\begin{equation}
\label{eq:lem-fleeting-closure-memoization-57}
\var{lsly} = \var{mlslx}.
\end{equation}
Then
\begin{align}
& \Leosilo{\var{lsly}}
&& \eqref{eq:lem-fleeting-closure-memoization-40},
\eqref{eq:lem-fleeting-closure-memoization-57}
\\
& \Veim{y} \in \var{lsly}
&& \eqref{eq:lem-fleeting-closure-memoization-54},
\eqref{eq:lem-fleeting-closure-memoization-57}
\\
& \var{lsly} \subseteq \var{maxslo}
&& \eqref{eq:lem-fleeting-closure-memoization-46},
\eqref{eq:lem-fleeting-closure-memoization-57}
\end{align}
This shows the inner implication
and therefore
\eqref{eq:def-memoized-eim-10} for $\Veim{eim} \gets \Veim{y}$.

\textbf{Conclusion}:
From the inner implication, we have
$\Memoized{\Veim{y}}$ and therefore the outer implication.
The outer implication was a forward implication,
\[
\Memoized{\Veim{x}} \implies \Memoized{\Veim{y}},
\]
but, as noted, the order of \Veim{x} and \Veim{y} was
chosen without loss of generality.
So by showing the forward implication,
we have also shown
the reverse implication,
and therefore the mutual implication
in the statement of the theorem.
With the mutual implication,
we have Case 3, and therefore the theorem.
\end{proof}

\begin{theorem}
\ttitle{Ethereal closure of unmemoized base}
\label{ethereral-closure-of-unmemoized-base}
If the base of an ethereal closure is
not memoized,
no EIM in that ethereal closure will be memoized.
\end{theorem}

\begin{proof}
By the definition of an ethereal closure,
all of its elements are its base,
predictions, or the null-scan of some other
element of the ethereal closure.
By assumption for the theorem,
the base is not memoized.
By Theorem
\ref{t:no-memoized-predictions},
no prediction is memoized.

It remains to show the theorem for null-scans.
Every null-scan is \Veim{ns}
such that
$\Veim{ns} = \iop{null-scan-op}{\var{i}}{\Veim{fc0}}$
for some $\var{i} > 0$,
where \Veim{fc0} is either the base of the ethereal
closure or a prediction.
If \Veim{fc0} is a prediction,
\Veim{ns} is a quasi-prediction.
By Theorem
\ref{t:no-memoized-predictions},
no quasi-prediction is memoized.

If \Veim{fc0} is the base of the ethereal closure then,
by the definition of a fleeting closure,
\Veim{ns} is in the fleeting closure of \Veim{fc0}.
\Veim{fc0} was unmemoized by assumption for the theorem,
so that by Theorem
\ref{t:fleeting-closure-memoization},
\Veim{ns} is not memoized.
\end{proof}

\begin{theorem}
\ttitle{Reads not memoized}
\label{t:read-eim-not-leo}
Read EIM's and the EIM's in the
ethereal closure of a read EIM
are never Leo-memoized.
\end{theorem}

\begin{proof}
Call a read EIM, \Veim{scanned}.
If \Veim{scanned} is not in a Leo silo,
by the definition of memoized,
\Veim{scanned} is not memoized.

By
Theorem
\ref{t:eim-maximal-silo},
if \Veim{scanned} is in a Leo silo,
then \Veim{scanned}
is in a maximal Leo silo,
call it \var{maxslo}.
By Theorem
\ref{t:silo-read-eim-layer},
\Veim{scanned}
is the bottom of every silo it is in,
so that \Veim{scanned}
is the bottom of \var{maxslo},
and therefore
\Veim{scanned}
is the bottom of a maximal Leo silo.
By the definition of memoized,
the bottom of a maximal Leo silo is
never memoized.
Therefore
\begin{equation}
\label{eq:read-eim-not-leo-10}
\neg \; \Memoized{\el{maxslo}{0}}.
\end{equation}

This theorem
follows from
\eqref{eq:read-eim-not-leo-10}
and Theorem
\ref{ethereral-closure-of-unmemoized-base}.
\end{proof}

\begin{theorem}
\ttitle{Only silo causes are memoized}
\label{t:only-silo-causes-memoized}
If \Veim{cuz} is memoized, whenever
it is a cause, it is a Leo silo cause.
\end{theorem}

\begin{proof}
By the definition of Leo memoized,
\Veim{cuz} must occur in a Leo silo,
call it \var{lsl}.
Also, \Veim{cuz} must not be the top
of any maximal Leo silo.
Since, by Theorem
\ref{t:leo-top-maximality},
the top of \var{lsl} is the top of the maximal Leo silo
containing \var{lsl}
with respect to every maximal silo that contains \var{lsl},
\Veim{cuz} cannot be the top of any Leo silo.
If \Veim{cuz} is not the top of any Leo silo,
it has a silo effect.
By Theorem \ref{t:leo-silo-validity},
the effect of \Veim{cuz} will be unique.
Call this unique effect, \Veim{eff}.
\Veim{cuz} is a Leo silo cause of \Veim{eff}.
And, since \Veim{eff} is the unique effect
of \Veim{cuz}, \Veim{cuz} is a Leo silo cause
whenever it is a cause.
\end{proof}

\begin{theorem}
\label{t:memoized-effects}
If an EIM is unmemoized,
either it has an unmemoized silo cause
or it is a top item in some Leo silo.
\end{theorem}

\begin{proof}
TODO: revise

Let \Veim{eff} and \Veim{cuz} be valid EIM's
such that \Veim{cuz} is the cause of \Veim{eff}.
Assume for a reductio that
\begin{gather}
\label{eq:memoized-effects-10}
\myparbox{\Veim{eff} is unmemoized,
} \\
\label{eq:memoized-effects-12}
\myparbox{\Veim{eff} is not the top item
in any Leo silo; and
} \\
\label{eq:memoized-effects-14}
\myparbox{\Veim{cuz} is memoized.
}
\end{gather}

By the definition of memoized,
if \Veim{cuz} is memoized, it occurs only in Leo
silos, and \Veim{cuz} is not the top of any maximal Leo silo.
By Theorem \ref{t:leo-top-maximality},
since \Veim{cuz} is not the top of any maximal Leo silo,
it is not the top of any Leo silo.
Therefore, \Veim{cuz} must have an effect.

By Theorem \ref{t:leo-silo-validity}
an effect of an inner Leo silo layer is another Leo silo layer.
By \eqref{eq:memoized-effects-12},
an assumption for the reductio,
\Veim{eff} is not the top layer in any Leo silos.
Because in all of those Leo silos,
\Veim{eff} is an effect of \Veim{cuz},
\Veim{eff} is not the bottom layer in any of those Leo silos.
Therefore \Veim{eff} is an inner layer in all of those Leo silos.
Therefore \Veim{eff} is memoable in all of its occurrences in
Leo silos.
\end{proof}

\begin{theorem}
\label{t:leo-memo-from-top}
Let \Veim{top} be a valid Leo top item.
Then a bottom-up cause which a Leo memo
for that top cause
will be valid and unmemoized.
\end{theorem}

\begin{proof}
TODO: revise

By the definition of Leo silo,
if \Veim{top} is a Leo top,
it is because there is
an instantiated Leo memo with a valid matching bottom.
Call the memo
\Vleo{leo},
and the bottom that matches it, \Veim{up}.
By Theorem \ref{t:leo-silo-validity}
there is a valid silo with \Veim{up}
as its bottom.
A bottom EIM is not memoable.
If an EIM is not memoable in any of
its occurrences, then it is not memoized.
\end{proof}

\begin{theorem}
\label{t:accept-eim-not-memoized}
The accept EIM is never memoized.
\end{theorem}

\begin{proof}
By definition of the accept EIM,
it has no effect.
Therefore, if the accept EIM is in a Leo silo,
it is the top of a maximal Leo silo.
By the definition of memoized, the top of a maximal Leo silo
is not memoized.
\end{proof}

TODO: Finish?

\chapter{The Marpa Recognizer}
\label{ch:recce}
\label{ch:pseudocode}

\section{Complexity}

Alongside the pseudocode of this section
are observations about its space and time complexity.
In what follows,
we will charge all time and space resources
to Earley items,
or to attempts to add Earley items.
We will show that,
to each Earley item actually added,
or to each attempt to add a duplicate Earley item,
we can charge amortized \Oc{} time and space.

At points, it will not be immediately
convenient to speak of
charging a resource
to an Earley item
or to an attempt to add a duplicate
Earley item.
In those circumstances,
we speak of charging time and space
\begin{itemize}
\item to the parse; or
\item to the Earley set; or
\item to the current procedure's caller.
\end{itemize}

We can charge time and space to the parse itself,
as long as the total time and space charged is \Oc.
Afterwards, this resource can be re-charged to
the initial Earley item, which is present in all parses.
Soft and hard failures of the recognizer use
worst-case \Oc{} resource,
and are charged to the parse.

We can charge resources to the Earley set,
as long as the time or space is \Oc.
Afterwards,
the resource charged to the Earley set can be
re-charged to an arbitrary member of the Earley set,
for example, the first.
If an Earley set is empty,
the parse must fail,
and the time can be charged to the parse.

In a procedure,
resource can be ``caller-included''.
Caller-included resource is not accounted for in
the current procedure,
but passed upward to the procedure's caller,
to be accounted for there.
A procedure to which caller-included resource is passed will
sometimes pass the resource upward to its own caller,
although of course the top-level procedure does not do this.

For each procedure, we will state whether
the time and space we are charging is inclusive or exclusive.
The exclusive time or space of a procedure is that
which it uses directly,
ignoring resource charges passed up from called procedures.
Inclusive time or space includes
resource passed upward to the
current procedure from called procedures.

Earley sets may be represented by \Ves{i},
where \var{i} is the Earley set's location \Vloc{i}.
The two notations should be regarded as interchangeable.
The actual implementation of either
should be the equivalent of a pointer to
a data structure containing,
at a minimum,
the Earley items,
a memoization of the Earley set's location as an integer,
and a per-set-list.
Per-set-lists will be described in Section \ref{s:per-set-lists}.

\begin{algorithm}[tb]
\algtitle{Marpa Top-level}{alg:top}
\begin{algorithmic}[1]
\Procedure{Main}{}
\State \Call{Initialization}{}
\label{line:top-20}
\For{ $\var{i}, 0 \le \var{i} \le \Vsize{w}$ }
\label{line:top-30}
\State \Call{Read pass}{$\var{i}, \var{w}[\Vdecr{i}]$}
\label{line:top-33}
\If{$\size{\Ves{i}} = 0$}
\State reject \Cw{} and return
\EndIf
\State \Call{Reduction pass}{\var{i}}
\label{line:top-40}
\EndFor
\If{$[\Vdr{accept}, 0] \in \Etable{\Vsize{w}}$}
\State accept \Cw{} and return
\EndIf
\State reject \Cw{}
\EndProcedure
\end{algorithmic}
\end{algorithm}

\section{Top-level code}

Exclusive time and space for the loop over the Earley sets
is charged to the Earley sets.
Inclusive time and space for the final loop to
check for \Vdr{accept} is charged to
the Earley items at location \size{\Cw}.
Overhead is charged to the parse.
All these resource charges are obviously \Oc.

\section{Ruby Slippers parsing}
This top-level code represents a significant change
from previous versions of Earley's algorithm.
\call{Read pass}{} and \call{Reduction pass}{}
are separated.
As a result,
when the scanning of tokens that start at location \Vloc{i} begins,
the Earley sets for all locations prior to \Vloc{i} are complete.
This means that the scanning operation has available, in
the Earley sets,
full information about the current state of the parse,
including which tokens are acceptable during the scanning phase.


\begin{algorithm}[tb]
\algtitle{Initialization}{alg:initial}
\begin{algorithmic}[1]
\Procedure{Initialization}{}
\State \Call{Add EIM set}{$\dr{start}, 0, 0$}
\label{line:initial-10}
\EndProcedure
\end{algorithmic}
\end{algorithm}

\section{Initialization}
\label{p:initial-op}

\subsection{Initialization complexity}
\label{p:initial-op-complexity}
Inclusive time and space is \Oc{}
and is charged to the parse.

\subsection{Initialization correctness}
\label{p:initial-op-correct}

\begin{theorem}
\label{t:initial-op-correct}
Initialization is correct.
\end{theorem}

\begin{proof}
From Theorem
\ref{t:earley-set-0-is-Leo-free},
we know that Leo memoization has
no effect on the set of
EIM's in Earley set 0.

Since the bottom-up causes of both
reads and reductions
have an input length greater than 0,
these EIM's cannot appear in Earley set 0.
All EIM's in Earley set 0 are therefore
\begin{itemize}
\item the start Earley item,
\item predictions, or
\item null-scans.
\end{itemize}

The set of start Earley items that we will
add to Earley set 0 is the singleton set
\begin{multline*}
\left\lbrace \bigl[ [ \Vsym{accept} \de \mydot \Vsym{start} ], 0, 0 \bigr] \right\rbrace \\
\text{where $[ \Vsym{accept} \de \mydot \Vsym{start} ]$ is the start rule.}
\end{multline*}
We first show that this set is correct.
It is consistent by Theorem \ref{t:start-eim-is-valid}.
It is complete because the start rule is by definition unique.
Therefore the set of start EIM's
added by
Algorithm \ref{alg:initial} to Earley set 0
is correct.

TODO: Prove these next assertions.

The predictions and null-scans
must have a top-down cause in the same
Earley set.
Together, the predictions and null-scans
are exactly the EIM's with null transitions.
So null transition EIM's
must have some other EIM in Earley set 0
as either a direct or an indirect cause.
The start Earley item is
the only remaining possibility,
and it is in Earley set 0.
Therefore the start Earley item is the direct
or indirect cause of all other EIM's in Earley set 0.

From these considerations, we see that Earley set 0
consists of the start Earley item and the transitive
closure of null transitions from it.
By Theorem \ref{t:ethereal-closure-op-correct},
this is exactly the set of EIM's added to Earley set 0
in line
\ref{line:initial-10}
of Algorithm \ref{alg:initial}.
\end{proof}

\begin{algorithm}[tb]
\algtitle{Read pass}{alg:read-pass}
\begin{algorithmic}[1]
\Procedure{Read pass}{$\Vloc{i},\Vsym{up}$}
\State Note: Each pass through this loop is an EIM attempt
\For{each $\Veim{down} \in \var{transitions}((\var{i} \subtract 1),\Vsym{up})$}
\label{line:read-pass-18}
\State $[\Vdr{down}, \Vloc{origin}] \gets \Veim{down}$
\label{line:read-pass-20}
\State $\Vdr{effect} \gets \GOTO(\Vdr{down}, \Vsym{up})$
\State \Call{Add EIM set}{$\Vdr{effect}, \Vloc{origin}, \Vloc{i}$}
\label{line:read-pass-40}
\EndFor
\EndProcedure
\end{algorithmic}
\end{algorithm}

\section{Read pass}
\label{p:read-op}

\subsection{Read pass complexity}
\label{p:read-op-complexity}

\var{transitions} is a set of tables, one per Earley set.
The tables in the set are indexed by symbol.
Symbol indexing is \Oc, since the number of symbols
is a constant, but
since the number of Earley sets grows with
the length of the parse,
it cannot be assumed that Earley sets can be indexed by location
in \Oc{} time.
For the operation $\var{transitions}(\Vloc{l}, \Vsym{s})$
to be in \Oc{} time,
\Vloc{l} must represent a link directly to the Earley set.
In the case of scanning,
the lookup is always in the previous Earley set,
which can easily be tracked in \Oc{} space
and retrieved in \Oc{} time.
Inclusive time and space can be charged to the
\Veim{down}.
Overhead is charged to the Earley set at \Vloc{i}.

\subsection{Read pass correctness}
\label{p:read-op-correct}

\begin{theorem}
\label{t:read-op-correct}
Call the
EIM's at \Vloc{i}
whose bottom-up cause is a terminal
symbol instance,
the ``EIM's read at \Vloc{i}''.
Let the Earley tables for all locations
\Vloc{h},
$\var{h} < \Vloc{i}$ be correct.
Then
Algorithm \ref{alg:read-pass}
at \Vloc{i}
adds all and only
the ethereal closure of
the EIM's read at \Vloc{i}.
\end{theorem}

\begin{proof}
We first assure ourselves that Leo
memoization has no effect on the read pass.
The bottom-up causes
in Algorithm
\ref{alg:read-pass}
are terminal symbol instances.
Leo memoizations are of EIM's ---
terminal instances are not Leo-memoized.

The top-down causes
in Algorithm
\ref{alg:read-pass}
must be quasi-incomplete because they are the result
of the \var{transitions} function,
which only memoizes EIM's with a telluric postdot
symbol ---
see line
\ref{line:memoize-transitions-20}
in Algorithm
\ref{alg:memoize-transitions}.
A quasi-complete EIM cannot have a
telluric postdot symbol,
so therefore
\Veim{down} at line
\ref{line:read-pass-20}
must be quasi-incomplete.
By Theorem
\ref{t:leo-quasi-complete},
no quasi-incomplete EIM
is Leo-memoized.
Therefore none of the EIM's used
in Algorithm
\ref{alg:memoize-transitions}
will be overlooked because
of Leo memoization.

By Theorem \ref{t:read-eim-not-leo},
read EIM's are never Leo-memoized.
We have now shown that none of the parse instances
referenced in Algorithm \ref{alg:read-pass}
are Leo-memoized.
We will therefore ignore Leo memoization in the
rest of this proof.

By the definition of \Cw{},
there is only one
terminal symbol instance
with right location \Vloc{i}.
Without loss of generality, let this instance be
\begin{equation}
\label{eq:read-op-correct-40}
\mkl{\var{i} \subtract 1} \,\, \Vsym{up} \Vmkr{i}
\end{equation}
The EIM's read at \Vloc{i}
are the EIM's whose bottom-up cause
is \eqref{eq:read-op-correct-40}.

The definition of matching top-down cause
requires that \Veim{down} have a postdot symbol
of \Vsym{up} and a right location of
${\var{i} \subtract 1}$.
By Theorem
\ref{t:memoize-transitions-correct},
the \var{transitions} function returns all of these for
use as the value of \Veim{down}
in the loop at line
\ref{line:read-pass-18}.

From this, we observe that
all and only
the matching pairs of causes
for the EIM's read at \Vloc{i}
are used to add EIM's
in the loop at line
\ref{line:read-pass-40}.
Call this the ``cause-correctness'' observation.

From the cause-correctness observation and
Theorem
\ref{t:effect-from-symbolic-cause-pair}
we know that the EIM's we attempt to add
at line
\ref{line:read-pass-40}
are consistent.
From the cause-correctness observation and
Theorem
\ref{t:symbolic-causes-from-effect}
we know that the EIM's we attempt to add
at line
\ref{line:read-pass-40}
are complete.

Since the EIM's we attempt to add
at line
\ref{line:read-pass-40}
are consistent and complete,
we know that,
at line
\ref{line:read-pass-40},
we attempted to add EIM's from
a correct set of causes
for the EIM's read at \Vloc{i}.
By Theorem
\ref{t:ethereal-closure-op-correct}
we know that the
Algorithm
\ref{alg:eim-set}
used
at line
\ref{line:read-pass-40}
adds the ethereal closure of
the EIM that is its argument.
Therefore, we did add
all of, and only, the EIM's
in the ethereal closure of the
EIM's read at \Vloc{i},
as required for the theorem.
\end{proof}

\section{Reduction pass complexity}
\label{p:reduction-op-complexity}

\begin{algorithm}[tb]
\algtitle{Reduction pass}{alg:reduction-pass}
\begin{algorithmic}[1]
\Procedure{Reduction pass}{\Vloc{i}}
\State Note: \Vtable{i} may include EIM's added
\State \hspace{2.5em} by \Call{Reduce one up-cause}{} and
\State \hspace{2.5em} the loop must traverse these
\label{line:reduction-pass-18}
\For{each completed Earley item $\Veim{up} \in \Vtable{i}$}
\label{line:reduction-pass-20}
\State $[\Vdr{up}, \Vloc{origin}, \Vloc{dummy}] \gets \Veim{up}$
\State \Comment It is always the case that $\Vloc{dummy} = \Vloc{i}$
\State \Call{Reduce one up-cause}{\Vloc{i}, \Vloc{origin}, \LHS{\Vdr{up}}}
\EndFor
\label{line:reduction-pass-50}
\State \Call{Memoize transitions}{\Vloc{i}}
\EndProcedure
\end{algorithmic}
\end{algorithm}

The loop over \Vtable{i} must also include
any items added
by Algorithm \ref{alg:reduction-pass}.
This can be done by implementing \Vtable{i} as an ordered
set and adding new items at the end.

Exclusive time is clearly \Oc{} per
\Veim{work},
and is charged to the \Veim{work}.
Additionally,
some of the time required
by Algorithm \ref{alg:reduction-pass}
is caller-included,
and therefore charged to this procedure.
Inclusive time from
Algorithm \ref{alg:reduction-pass}
is \Oc{} per call,
as will be seen in section \ref{p:reduce-one-up-cause},
and is charged to the \Veim{work}
that is current
during that call to
Algorithm \ref{alg:reduction-pass}.
Overhead may be charged to the Earley set at \Vloc{i}.

\section{Reduction pass correctness}
\label{p:reduction-op-correct}

This section is devoted to showing that
Algorithm \ref{alg:reduction-pass} is correct.
In proving this, we will repeatedly employ two
``environmental''
assumptions.
Later we will show that both of those
assumptions are guaranteed
by the caller of
Algorithm \ref{alg:reduction-pass}.
For now, we will assume them explicitly
when needed.

The first ``environmental'' assumption is
\begin{equation}
\label{eq:reduction-op-correct-5}
\tag{ENV1}
\begin{aligned}
& \text{for all locations \Vloc{h},
and all symbols in \Cg{}, \Vsym{sym},
} \\
& \text{if $\var{h} < \Vloc{current}$,} \\
& \text{then \Ves{h} is correct} \\
& \qquad \qquad
  \text{and $\var{transitions}(\var{h}, \Vsym{sym})$ is correct.}
\end{aligned}
\end{equation}
and the second ``environmental'' assumption is
\begin{equation}
\label{eq:reduction-op-correct-8}
\tag{ENV2}
\begin{aligned}
& \text{the ethereal closure of the set} \\
& \qquad \qquad \text{of EIM's read at \Vloc{current} is correct.}
\end{aligned}
\end{equation}

\begin{observation}
\label{obs:effect-eim}
For the purposes of this section,
we will call an EIM
added by
Algorithm \ref{alg:reduction-pass}
a ``reduction pass effect''.
From examining the pseudocode,
we observe that reduction pass effects
added by
Algorithm \ref{alg:reduction-pass}
are added indirectly,
by the calls of \call{Add EIM set}{}
\begin{itemize}
\item
in Algorithm \ref{alg:earley-reduction-op}
at line \ref{line:earley-reduction-op-20}; and
\item
in Algorithm \ref{alg:leo-reduction-op}
at line \ref{line:leo-reduction-op-20}.
\end{itemize}
\end{observation}

\begin{lemma}
\label{lem:reduction-effect-validity}
\ltitle{Reduction Effect validity}
If the causes are valid, every attempt
by Algorithm \ref{alg:leo-reduction-op} to
add a reduction pass effect
adds
the ethereal closure of the
reduction pass effect.
\end{lemma}

\begin{proof}
From Theorem
\ref{t:effect-from-symbolic-cause-pair},
we know that the telluric base EIM's we attempt to add
at line
\ref{line:earley-reduction-op-20}
of Algorithm \ref{alg:earley-reduction-op}
are valid if their causes are valid.
From Theorem
\ref{t:leo-silo-validity},
we know that the telluric base EIM's we attempt to add
at line
\ref{line:leo-reduction-op-20}
of Algorithm \ref{alg:leo-reduction-op}
are valid if their causes are valid.
Combining both cases, we know that
every attempt to
add a telluric base EIM by Algorithm \ref{alg:reduction-pass}
is valid if its causes are valid.

By Theorem
\ref{t:ethereal-closure-op-correct}
we know that the
Algorithm
\ref{alg:eim-set}
used
at line
\ref{line:earley-reduction-op-20}
of Algorithm \ref{alg:earley-reduction-op}
and
at line
\ref{line:leo-reduction-op-20}
of Algorithm \ref{alg:leo-reduction-op}
adds the ethereal closure of the telluric base EIM's
added at those lines.
\end{proof}

\begin{theorem}
\label{t:reduction-op-correct}
Let \Veimset{reduced-base} be
the set of
unmemoized EIM's at \Vloc{current}
which are reductions ---
that is,
EIM's whose bottom-up cause is an EIM.
Let \Veimset{reduced-closure} be
the ethereal closure of \Veimset{reduced-base}.
If \eqref{eq:reduction-op-correct-5}
and \eqref{eq:reduction-op-correct-8},
then after Algorithm \ref{alg:reduction-pass}
runs,
the set of EIM's at \Vloc{current}
is correct for membership in \Veimset{reduced-closure}.
\end{theorem}

\begin{proof}


\textbf{Top-down correctness}:
Consider an arbitrary top-down cause of
a reduced EIM at \Vloc{current}.
Call this EIM, \Veim{down}.
Because \Veim{down} is the top-down cause
of a reduced EIM,
Theorem
\ref{t:right-location-of-top-down-cause}
tells us that
\begin{equation}
\label{eq:reduction-op-correct-18}
\Right{\Veim{down}} < \Vloc{current}.
\end{equation}
From
\eqref{eq:reduction-op-correct-5},
an assumption for the theorem, and
\eqref{eq:reduction-op-correct-18}
we see that \Veim{down} is correct.
Since the choice of \Veim{down} as a top-down cause at
\Vloc{current} was without loss of generality,
we can state that
\begin{equation}
\label{eq:reduction-op-correct-21}
\myparbox{
All of the top-down causes used
by Algorithm \ref{alg:leo-reduction-op} are
correct.
}
\end{equation}

\textbf{Iteration sets}:
For the purposes of this proof we divide the EIM's
added by
Algorithm \ref{alg:reduction-pass} into a sequence
of sets,
\[\var{iter}[0], \var{iter}[1], \ldots, \var{iter}[\var{n}].\]
$\var{iter}[0]$ is the set of EIM's
at line
\ref{line:reduction-pass-18} of Algorithm \ref{alg:reduction-pass},
before its main loop
from line
\ref{line:reduction-pass-20}
to line \ref{line:reduction-pass-50}.
$\var{iter}[\var{i}]$ is the set of EIM's
added during the \var{i}'th iteration of the main loop
of Algorithm \ref{alg:reduction-pass}.
Iterations are numbered starting with 1,
so that
$\var{iter}[1]$ is the set of EIM's
added during the first iteration of the main loop.

\textbf{Consistency and altitude}:
To show that
Algorithm \ref{alg:reduction-pass} adds only
valid EIM's,
we proceed by induction on the sets in \var{iter}.
Let the induction hypothesis be that
\begin{equation}
\label{eq:reduction-op-correct-21b}
\myparbox{the EIM's in \var{iter}[\var{i}] are valid, unmemoized
and at altitude \var{i}.}
\end{equation}
At line
\ref{line:reduction-pass-18} of Algorithm \ref{alg:reduction-pass},
\Ves{i} contains only read EIM's and their
ethereal closure.
From \eqref{eq:reduction-op-correct-8},
an assumption for the theorem,
we know that
the EIM's in \var{iter}[0] are valid and unmemoized.
By Definition \ref{def:altitude},
read EIM's have altitude 1.
Using Theorem \ref{t:ethereal-altitude},
we see that
all EIM's in the ethereal closure of read EIM's
have altitude 1.
So all EIM's in \var{iter}[0] have altitude 1.
This shows \eqref{eq:reduction-op-correct-21b} for $\var{i} = 0$,
which is the basis of our induction.

For the step, we assume
\eqref{eq:reduction-op-correct-21b}
and we seek to show that
\begin{equation}
\label{eq:reduction-op-correct-21c}
\myparbox{the EIM's in \var{iter}[\var{i}+1] are valid, unmemoized
and at altitude \var{i}+1.}
\end{equation}
For the EIM's in
$\var{iter}[\var{i}+1]$,
the top-down causes are valid by
\eqref{eq:reduction-op-correct-21}
and the bottom-up causes are valid by the assumption for the
induction step so that,
by Lemma \ref{lem:reduction-effect-validity},
we see that
\begin{equation}
\label{eq:reduction-op-correct-23}
\myparbox{
all EIM's in
$\var{iter}[\var{i}+1]$ are valid.
}
\end{equation}

We next show that
all EIM's in
$\var{iter}[\var{i}+1]$
are unmemoized.
Again using
\eqref{eq:reduction-op-correct-21},
the induction step,
and Lemma \ref{lem:reduction-effect-validity},
we see that all of the causes
of EIM's in
$\var{iter}[\var{i}]$ are unmemoized.
We need to show that all of the EIM's in
$\var{iter}[\var{i}+1]$ are unmemoized.
By Theorem \ref{t:memoized-effects},
every memoized
effect either has a memoized cause,
or else is a Leo top EIM.
So if $\Veim{x} \in \var{iter}[\var{i}+1]$ is
memoized,
\Veim{x} must be a Leo top
EIM, and therefore must have a Leo memo.
From line
\ref{line:reduce-one-up-cause-25}
of Algorithm
\ref{alg:reduce-one-up-cause}
and from Theorem
\ref{t:leo-silo-validity},
we see that if \Veim{x} has a Leo memo,
line \ref{line:reduce-one-up-cause-30}
of Algorithm
\ref{alg:reduce-one-up-cause},
will add a valid, unmemoized EIM.
So
\begin{equation}
\label{eq:reduction-op-correct-24}
\myparbox{
every EIM $\Veim{x} \in \var{iter}[\var{i}+1]$ is
unmemoized.
}
\end{equation}

To determine their altitude, we look at
the EIM's added
to $\var{iter}[\var{i}+1]$ by cases.
There are two cases:
\begin{enumerate}
\item
\label{case:reduction-op-correct-24}
Case \ref{case:reduction-op-correct-24}:
Those added at
line \ref{line:earley-reduction-op-20}
of Algorithm \ref{alg:earley-reduction-op}; and
\item
\label{case:reduction-op-correct-25}
Case \ref{case:reduction-op-correct-25}:
those added
at line \ref{line:leo-reduction-op-20}
of Algorithm \ref{alg:leo-reduction-op}.
\end{enumerate}

For Case \ref{case:reduction-op-correct-24},
the EIM's added are
the ethereal closure of
the reduced EIM's whose bottom-up cause
is in $\var{iter}[\var{i}]$.
By Definition \ref{def:altitude}
and Theorem \ref{t:ethereal-altitude},
the EIM's of
Case \ref{case:reduction-op-correct-24}
have altitude $\var{i}+1$.
For Case \ref{case:reduction-op-correct-25},
the EIM's added are
the ethereal closure of
the Leo reduced EIM's whose bottom-up cause
is in $\var{iter}[\var{i}]$.
By Theorems
\ref{t:leo-silo-validity}
and \ref{t:ethereal-altitude},
the EIM's of
Case \ref{case:reduction-op-correct-25}
have altitude $\var{i}+1$.
In both cases, the EIM's added
have altitude $\var{i}+1$,
and therefore
\begin{equation}
\label{eq:reduction-op-correct-29}
\myparbox{
all EIM's in
$\var{iter}[\var{i}+1]$
have altitude $\var{i}+1$.
}
\end{equation}

Using
\eqref{eq:reduction-op-correct-23},
\eqref{eq:reduction-op-correct-24}
and
\eqref{eq:reduction-op-correct-29},
we have
\eqref{eq:reduction-op-correct-21c},
the step of the induction,
and the induction.
From this we conclude that
\begin{equation}
\label{eq:reduction-op-correct-30}
\forall \;
  \var{i}, \text{$\var{iter}[\var{i}]$ is consistent.}
\end{equation}
and
\begin{equation}
\label{eq:reduction-op-correct-31}
\forall \;
  \var{i}, \Alt{\var{iter}[\var{i}]} = \var{i}.
\end{equation}

\textbf{Completeness of the iteration sets}:
To show that
after
Algorithm \ref{alg:reduction-pass} every set of
\var{iter} is complete,
we proceed by induction on the sets in \var{iter}.
Let the induction hypothesis be that
\begin{equation}
\label{eq:reduction-op-correct-35}
\myparbox{the EIM's in \var{iter}[\var{i}] are complete.}
\end{equation}
From \eqref{eq:reduction-op-correct-8},
an assumption for the theorem,
we have
\eqref{eq:reduction-op-correct-35} for $\var{i} = 0$,
and this is the basis of our induction.

For the step, we assume
\eqref{eq:reduction-op-correct-35}
and we seek to show
\begin{equation}
\label{eq:reduction-op-correct-40}
\myparbox{the EIM's in \var{iter}[\var{i}+1] are complete.}
\end{equation}
For the EIM's in
$\var{iter}[\var{i}+1]$,
the top-down causes are complete by
\eqref{eq:reduction-op-correct-21}
and the bottom-up causes are complete by the assumption for the
induction step.
So we have complete sets of unmemoized, valid causes for
both bottom-up causes and top-down causes.

We now show that
Algorithm \ref{alg:reduction-pass}
pairs every bottom-up cause with
all of its matching top-down causes.
From line
\ref{line:reduction-pass-20}
of Algorithm
\ref{alg:reduction-pass}
we see that all valid unmemoized bottom-up causes
are used in an outer loop.
From Theorem
\ref{t:memoize-transitions-correct}
and
line
\ref{line:reduce-one-up-cause-20}
of Algorithm
\ref{alg:reduce-one-up-cause},
we see that each
of these unmemoized bottom-up causes
is paired with the matching set of valid top-down causes.

It remains to show that
no unmemoized, valid EIM's are omitted
from $\var{iter}[\var{i}+1]$
because their silo causes
are memoized.
By Theorem
\ref{t:memoized-effects},
all valid unmemoized items have valid unmemoized silo causes except
for Leo top items.
Without loss of generality,
let a Leo top item be
\Veim{top}.
In the case of \Veim{top},
by Theorem \ref{t:leo-memo-from-top},
there will be a valid unmemoized bottom-up cause
which matches the Leo memo,
so that
line \ref{line:reduce-one-up-cause-30}
of Algorithm
\ref{alg:reduce-one-up-cause}
will add the ethereal closure of \Veim{top}.
Therefore all unmemoized, valid EIM's are added
to
$\var{iter}[\var{i}+1]$.

This shows
\eqref{eq:reduction-op-correct-40},
the step of the induction,
and the induction.
From this we conclude that
\begin{equation}
\label{eq:reduction-op-correct-50}
\forall \;
  \var{i}, \text{$\var{iter}[\var{i}+1]$ is complete.}
\end{equation}

\textbf{Completeness}:
We have shown completeness for all of the Earley sets in
\eqref{eq:reduction-op-correct-50}.
The theorem requires that we show
completeness for \Ves{current} for
membership in \var{reduced-closure}.
From
\eqref{eq:reduction-op-correct-30},
and \eqref{eq:reduction-op-correct-50},
we know that every iteration set is correct for
membership in \var{reduced-closure} ---
contains all and only the valid EIM's.
By Theorem
\ref{t:altitude-is-finite}
we know that every valid EIM has a defined,
finite altitude,
and by
\eqref{eq:reduction-op-correct-31},
we know every valid EIM is in the
iteration set whose index is the same
as the EIM's altitude.

It remains to show that the iteration sets
produced by
Algorithm
\ref{alg:reduction-pass} capture all of the
reductions necessary.
The loop starting at line
\ref{line:reduction-pass-20}
of Algorithm
\ref{alg:reduction-pass} stops at the first
empty iteration set.
This is adequate if all iteration sets after
the first empty iteration set are also empty:
\begin{equation}
\label{eq:reduction-op-correct-60}
\var{iter}[\var{i}] = \emptyset \land \var{i} \le \var{j}
    \implies \var{iter}[\var{j}] = \emptyset.
\end{equation}
Showing \eqref{eq:reduction-op-correct-60} is the same
as showing that
\begin{equation}
\label{eq:reduction-op-correct-63}
\nexists \, \var{x},
    \var{iter}[\var{x}] = \emptyset \land
    \var{iter}[\var{x}+1] \neq \emptyset
\end{equation}
Suppose, for a reductio, that there was a
\var{x} that did not satisfy
\eqref{eq:reduction-op-correct-63}.
All EIM's in
$\var{iter}[\var{x}+1]$ will have altitude
$\var{x}+1$
and will be
\begin{enumerate}
\item
\label{case:reduction-op-correct-66}
Case \ref{case:reduction-op-correct-66}:
in the ethereal closure added
by Algorithm \ref{alg:earley-reduction-op}
at line \ref{line:earley-reduction-op-20}; or
\item
\label{case:reduction-op-correct-70}
Case \ref{case:reduction-op-correct-70}:
in the ethereal closure added
by Algorithm \ref{alg:leo-reduction-op}
at line \ref{line:leo-reduction-op-20}.
\end{enumerate}
In Case \ref{case:reduction-op-correct-66},
by Definition \ref{def:altitude},
they will require a bottom-up cause with
altitude \var{x}.
In Case \ref{case:reduction-op-correct-70},
also by Definition \ref{def:altitude},
they will again require a bottom-up cause with
altitude \var{x}.
But $\var{iter}[\var{x}] = \emptyset$ by assumption
for the reductio.
So there is no bottom-up cause that can create
the EIM's in either
Case \ref{case:reduction-op-correct-66}
or Case \ref{case:reduction-op-correct-70}.
This shows the reductio,
\eqref{eq:reduction-op-correct-63},
and therefore
\eqref{eq:reduction-op-correct-60}.

\begin{sloppypar}
\textbf{Correctness}:
Let
\[ \var{reduction-pass-eims} = \bigcup_\var{i} \var{iter}[\var{i}]. \]
From the considerations in the part on \textbf{Completeness}
we conclude that
\var{reduction-pass-eims}
is complete for \Veimset{reduced-closure}.
From
\eqref{eq:reduction-op-correct-30},
we know that
\var{reduction-pass-eims} is consistent.
Therefore,
\var{reduction-pass-eims}
is correct for \Veimset{reduced-closure}.

\end{sloppypar}
\end{proof}

\begin{algorithm}[tb]
\algtitle{Memoize transitions}{alg:memoize-transitions}
\begin{algorithmic}[1]
\Procedure{Memoize transitions}{\Vloc{i}}
\For{every \Vsym{postdot}, a telluric postdot symbol of $\Ves{i}$}
\label{line:memoize-transitions-20}
\State Note: \Vsym{postdot} is ``Leo-eligible'' if it is
\State \hspace\algorithmicindent  Leo unique and its rule is right recursive
\If{\Vsym{postdot} is Leo-eligible}
\State Set $\var{transitions}(\Vloc{i},\Vsym{postdot})$
\State \hspace\algorithmicindent to a LEO
\Else
\State Set $\var{transitions}(\Vloc{i},\Vsym{postdot})$
\State \hspace\algorithmicindent to the set of EIM's at \Vloc{i} that have
\State \hspace\algorithmicindent \Vsym{postdot} as their postdot symbol
\EndIf
\EndFor
\EndProcedure
\end{algorithmic}
\end{algorithm}

\section{Memoize transitions}

The \var{transitions} table for \Ves{i}
is built once all EIM's have been
added to \Ves{i}.
We first look at the resource,
excluding the processing of Leo memos.
The non-Leo processing can be done in
a single pass over \Ves{i},
in \Oc{} time per EIM.
Inclusive time and space are charged to the
Earley items being examined.
Overhead is charged to \Ves{i}.

We now look at the resource used in the Leo processing.
A transition symbol \Vsym{transition}
is Leo-eligible if it is Leo unique
and its rule is right recursive.
(If \Vsym{transition} is Leo unique in \Ves{i}, it will be the
postdot symbol of only one rule in \Ves{i}.)
All but one of the determinations needed to decide
if \Vsym{transition} is Leo-eligible can be precomputed
from the grammar,
and the resource to do this is charged to the parse.
The precomputation, for example,
for every rule, determines if it is right recursive.

One part of the test for
Leo eligibility cannot be done as a precomputation.
This is the determination whether there is only one dotted
rule in \Ves{i} whose postdot symbol is
\Vsym{transition}.
This can be done
in a single pass over the EIM's of \Ves{i}
that notes the postdot symbols as they are encountered
and whether any is encountered twice.
The time and space,
including that for the creation of a LEO if necessary,
will be \Oc{} time per EIM examined,
and can be charged to the EIM being examined.

\begin{theorem}
\label{t:memoize-transitions-correct}
Algorithm \ref{alg:memoize-transitions}
is correct.
\end{theorem}

\begin{proof}
TODO: Make sure this accounts for the correctness of Leo memos.
TODO: Make sure this accounts for the completeness of all top-down causes.
\end{proof}

\begin{algorithm}[tb]
\algtitle{Reduce one up-cause}{alg:reduce-one-up-cause}
\begin{algorithmic}[1]
\Procedure{Reduce one up-cause}{\Veim{up}}
\State Note: Each pass through this loop is an EIM attempt
\State $\Vloc{orig} \gets \Left{\Veim{up}}$
\State $\Vsym{lhs} \gets \LHS{\Veim{up}}$
\State $\Vloc{current} \gets \Current{\Veim{up}}$
\For{each $\var{down} \in \var{transitions}(\var{orig},\var{lhs})$}
\label{line:reduce-one-up-cause-20}
\State \Comment \var{down} is a ``postdot item'', either a Leo memo or an EIM
\If{\var{down} is a Leo memo}
\label{line:reduce-one-up-cause-25}
\State Perform a \Call{Leo reduction operation}{}
\label{line:reduce-one-up-cause-30}
\State \hspace\algorithmicindent for operands \var{current}, \Vleo{down}
\Else
\State Perform a \Call{Earley reduction operation}{}
\label{line:reduce-one-up-cause-50}
\State \hspace\algorithmicindent for operands \var{current}, \Veim{down}, \var{lhs}
\EndIf
\EndFor
\EndProcedure
\end{algorithmic}
\end{algorithm}

\section{Reduce one up-cause}
\label{p:reduce-one-up-cause}

To show that
\begin{equation*}
\var{transitions}(\Vloc{origin},\Vsym{lhs})
\end{equation*}
can be traversed in \Oc{} time,
we note
that the number of symbols is a constant
and assume that \Vloc{origin} is implemented
as a link back to the Earley set,
rather than as an integer index.
This requires that \Veim{work}
in \call{Reduction pass}{}
carry a link
back to its origin.
As implemented, Marpa's
Earley items have such links.

Inclusive time
for the loop over the EIM attempts
is charged to each EIM attempt.
Overhead is \Oc{} and caller-included.

\begin{algorithm}[tb]
\algtitle{Earley reduction operation}{alg:earley-reduction-op}
\begin{algorithmic}[1]
\Procedure{Earley reduction operation}{\Vloc{current}, \Veim{down}, \Vsym{up}}
\State $\Vdr{effect} \gets \GOTO(\DR{\Veim{down}}, \Vsym{up})$
\State \Call{Add EIM set}{\Vdr{effect}, \Left{\Veim{down}}, \var{current}}
\label{line:earley-reduction-op-20}
\EndProcedure
\end{algorithmic}
\end{algorithm}

\section{Earley Reduction operation}
\label{p:reduction-op}

Exclusive time and space is clearly \Oc.
\call{Earley reduction operation}{} is always
called as part of an EIM attempt,
and inclusive time and space is charged to the EIM
attempt.

\begin{algorithm}[tb]
\algtitle{Leo reduction operation}{alg:leo-reduction-op}
\begin{algorithmic}[1]
\Procedure{Leo reduction operation}{\Vloc{current}, \Vleo{down}}
\State $[\Vdr{down}, \Vsym{up}, \Vloc{origin}] \gets \Vleo{down}$
\State $\Vdr{effect} \gets \GOTO(\DR{\Vdr{down}}, \Vsym{up})$
\State \Call{Add EIM set}{\Vdr{effect}, \Vloc{origin}, \var{current}}
\label{line:leo-reduction-op-20}
\EndProcedure
\end{algorithmic}
\end{algorithm}

\section{Leo reduction operation}
\label{p:leo-op}

Exclusive time and space is clearly \Oc.
\call{Leo reduction operation}{} is always
called as part of an EIM attempt,
and inclusive time and space is charged to the EIM
attempt.

\begin{algorithm}[tb]
\algtitle{Add EIM set}{alg:eim-set}
\begin{algorithmic}[1]
\Procedure{Add EIM set}{$\Vdr{base}, \Vloc{origin}, \Vloc{i}$}
\State $\Veim{base} \gets [\Vdr{base}, \Vloc{origin}]$
\If{\Veim{base} is new}
\State Add \Veim{base} to \Vtable{i}\label{line:eim-set-10}
\EndIf
\State $\Vdrset{next} \gets \GOTO(\Vdr{base}, \epsilon)$\label{line:eim-set-20}
\For{every $\Vdr{next} \in  \Vdrset{next}$}
\If{\Vdr{next} is a quasi-prediction}
\State $\Veim{next} \gets [\Vdr{next}, \Vloc{i}, \Vloc{i}]$
\label{line:eim-set-25}
\If{\Veim{next} is new}
\State Add \Veim{next} to \Vtable{i}\label{line:eim-set-30}
\EndIf
\Else
\State $\Veim{next} \gets [\Vdr{next}, \Vloc{origin}, \Vloc{i}]$
\label{line:eim-set-35}
\If{\Veim{next} is new}
\State Add \Veim{next} to \Vtable{i}\label{line:eim-set-40}
\EndIf
\EndIf
\EndFor
\EndProcedure
\end{algorithmic}
\end{algorithm}

\section{Adding a set of Earley items}
\label{p:add-eim-set}

\subsection{Complexity}
\label{p:ethereal-closure-op-complexity}

This operation adds the ethereal closure
of a confirmed EIM
item.
Inclusive time and space is charged to the
calling procedure.

By theorem \ref{t:ethereal-closure-Oc},
computing the ethereal closure is \Oc{}.
We show that other time charged is also \Oc{}
by singling out the two non-trivial cases:
checking that an Earley item is new,
and adding it to the Earley set.
\Marpa{} checks whether an Earley item is new
in \Oc{} time
by using a data structure called a PSL.
PSL's are the subject of Section \ref{s:per-set-lists}.
An Earley item can be added to the current
set in \Oc{} time
if the Earley set is seen as a linked
list, to the head of which the new Earley item is added.

The space required for the EIM's added is at most
one for the \Vdr{base},
one for every transition over a null postdot symbol,
and
one for every prediction.
The number of EIM's that result from
transitions over null postdot symbols is limited
by the maximum length of the RHS of a rule,
which is constant for a given \Cg{}.
At any \Vloc{i}, the number of predictions is
at most the number of rules in \Cg{}.
The number of EIM's that result from
predictions
is therefore constant for a given \Cg{}.
Summing the space, we see that all space
requirements are constant, so that the space
is \Oc{} per call.

\subsection{Prediction EIM complexity}
\label{p:prediction-op-complexity}

Looking specifically at predictions,
from the discussion in
\ref{p:ethereal-closure-op-complexity}, we see that
no time or space is ever charged
to a predicted Earley item.
At most one attempt to add a \Veim{predicted} will
be made per attempt to add a \Veim{confirmed},
so that the total resource charged
remains \Oc.

\subsection{Null transition correctness}
\label{p:prediction-op-correct}

\begin{theorem}
\label{t:ethereal-closure-op-correct}
Algorithm \ref{alg:eim-set} adds all and only the EIM's
for the ethereal closure of \Veim{base}.
\end{theorem}

\begin{proof}
We first examine the effect Leo memoization will
have
on Algorithm \ref{alg:eim-set}.
We note that
Algorithm \ref{alg:eim-set} is only called when
\Veim{base} is not Leo memoized.
By Theorem \ref{t:fleeting-closure-memoization},
we see that if \Veim{base} is not Leo memoized,
none of the other EIM's in its fleeting closure
will be Leo memoized.
By Theorem
\ref{t:no-memoized-predictions},
no prediction is ever memoized.
Therefore,
we may ignore Leo memoization in what follows.

TODO: Check the above assertion.

By inspection, we see that
Algorithm \ref{alg:eim-set} adds items
at lines
\ref{line:eim-set-10},
\ref{line:eim-set-30}
and \ref{line:eim-set-40}.
That the addition of \Veim{base}
at line \ref{line:eim-set-10}
is complete,
consistent and therefore correct,
follows directly from
inspection of
the pseudo-code.

Other than \Veim{base} itself,
all EIM's in the ethereal closure of
\Veim{base} are the product of
a series of null scans
and predictions.
These operations never change the current location ---
it will always be that of \Veim{base}.
The origin only changes if the operation is a prediction ---
the origin of a prediction is the same as its current
location.
This remains true for the null scan of a prediction ---
its origin is that of its top-down cause, but since
that top-down cause is a prediction,
the origin is the same as if it was a prediction.
By induction, we see that the origin of
all quasi predictions must be the same as
the current location of the prediction.

Let \Veim{new} be an EIM in the ethereal
closure,
other than \Veim{base} itself.
From the preceding analysis,
we see that
the current location of
\Veim{new}
depends
only
on its value in \Veim{base}.
The origin of \Veim{new} depends
on two things:
whether or not \Veim{new} is a quasi-prediction,
and the appropriate location value in \Veim{base}.

There is, therefore,
for each dotted rule,
only one correct set of values
for origin and current location.
These locations are
the ones
used by Algorithm \ref{alg:eim-set}
in lines
\ref{line:eim-set-25}
and \ref{line:eim-set-35}.
Therefore the set of correct EIM's corresponds
one-to-one
with the dotted rules
and, from inspection of
Algorithm \ref{alg:eim-set},
this is the set added by
Algorithm \ref{alg:eim-set}
at lines
\ref{line:eim-set-30}
and \ref{line:eim-set-40}.

It remains to show that the set of dotted rules on
which the EIM's added
at lines \ref{line:eim-set-30}
and \ref{line:eim-set-40}
are based
is correct.
The EIM's added at lines
\ref{line:eim-set-30}
and \ref{line:eim-set-40} are based on
the dotted rules found
at line
\ref{line:eim-set-20}.
By theorem \ref{t:ethereal-closure-dr-correct},
the transitive closure of null transitions from
the dotted rule of \Veim{base},
as found by line \ref{line:eim-set-20} of
Algorithm \ref{alg:eim-set},
is complete, consistent and therefore correct.
\end{proof}

\begin{theorem}\label{t:quasi-complete-correct}
Let \Veim{base} be quasi-complete.
If Algorithm \ref{alg:eim-set} adds \Veim{base},
it also adds all null transitions from it,
including the completion EIM of \Veim{base}.
\end{theorem}

\begin{proof}
For null transitions,
the result follows directly
from theorem \ref{t:ethereal-closure-op-correct}.
By the definition of completion EIM,
a completion EIM is the result of a null transition
from any of its quasi-completions,

TODO: Is this still right?

so that case also follows
from theorem \ref{t:ethereal-closure-op-correct}.
\end{proof}

\begin{theorem}\label{t:prediction-correct}
If Algorithm \ref{alg:eim-set} adds \Veim{base},
it also adds all predictions which are null transitions
from it,
including the valid quasi-prediction EIM's.
\end{theorem}

\begin{proof}
The predictions
and quasi-predictions are
null transitions from \Veim{base},
so the result follows directly
from theorem \ref{t:ethereal-closure-op-correct}.
\end{proof}

\section{Per-set lists}
\label{s:per-set-lists}

In the general case,
where \var{x} is an arbitrary datum,
it is not possible
to use the duple $[\Ves{i}, \var{x}]$
as a search key and expect the search to use
\Oc{} time.
Within \Marpa, however, there are specific cases
where it is desirable to do exactly that.
This is accomplished by
taking advantage of special properties of the search.

If it can be arranged that there is
a link direct to the Earley set \Ves{i},
and that $0 \leq \var{x} < \var{c}$,
where \var{c} is a constant of reasonable size,
then a search can be made in \Oc{} time,
using a data structure called a PSL.
Data structures identical to or very similar to PSL's are
briefly outlined in both
\cite[p. 97]{Earley1970} and
\cite[Vol. 1, pages 326-327]{AU1972}.
But neither source gives them a name.
The term PSL
(``per-Earley set list'')
is new
with Marpa.

A PSL is a fixed-length array of
integers, indexed by an integer,
and kept as part of each Earley set.
While \Marpa{} is building a new Earley set,
\Ves{j},
the PSL for every previous Earley set, \Vloc{i},
tracks the Earley items in \Ves{j} that have \Vloc{i}
as their origin.
The maximum number of Earley items that must be tracked
in each PSL is
the number of dotted rules,
\Vsize{\Cdr},
which is a constant of reasonable size
that depends on \Cg{}.

It would take more than \Oc{} time
to clear and rebuild the PSL's each time
that a new Earley set is started.
This overhead is avoided by ``time-stamping'' each PSL
entry with the Earley set
that was current when that PSL
entry was last updated.

As before,
where \Ves{i} is an Earley set,
let \Vloc{i} be its location,
and vice versa.
\Vloc{i} is an integer which is
assigned as Earley sets are created.
We can easily assign a zero-based numbering
to the dotted rules of the grammar,
call it $\ID{\Vdr{x}}$,
and this can be used as the integer ID of a dotted rule.
Let $\PSL{\Ves{x}}{\var{y}}$
be the entry for integer \var{y} in the PSL in
the Earley set at \Vloc{x}.

Consider the case where Marpa is building \Ves{j}
and wants to check whether Earley item \Veim{x} is new,
where $\Veim{x} = [ \Vdr{x}, \Vorig{x} ]$.
To check if \Veim{x} is new,
Marpa checks
\begin{equation*}
\var{time-stamp} = \PSL{\Ves{x}}{\ID{\Vdr{x}}}
\end{equation*}
If the entry has never been used,
we assume that $\var{time-stamp} = \undefined$.
If $\var{time-stamp} \ne \undefined \land \var{time-stamp} = \Vloc{j}$,
then \Veim{x} is not new,
and will not be added to the Earley set.

If $\var{time-stamp} = \undefined \lor \var{time-stamp} \ne \Vloc{j}$,
then \Veim{x} is new.
\Veim{x} is added to the Earley set,
and a new time-stamp is set, as follows:
\begin{equation*}
\PSL{\Ves{x}}{\ID{\Vdr{x}}} \gets \Vloc{j}.
\end{equation*}

\section{Complexity summary}

For convenience, we summarize
the complexity results
of this section here,
as theorems.

\begin{theorem}
\label{t:added-eim-charge}
The time and space charged to an Earley item
which is actually added to the Earley sets
is \Oc.
\end{theorem}

\begin{proof}
The theorem follows from collecting the results
in the complexity discussions of this section.
\end{proof}

\begin{theorem}
\label{t:dup-eim-time}
The time charged to an attempt
to add a duplicate Earley item to the Earley sets
is \Oc.
\end{theorem}

\begin{proof}
The theorem follows from collecting the results
in the complexity discussions of this section.
\end{proof}

For evaluation purposes, \Marpa{} adds a link to
each EIM that records each attempt to
add that EIM,
whether originally or as a duplicate.
Traditionally, complexity results treat parsers
as recognizers, and such costs are ignored.
This will be an issue when the space complexity
for unambiguous grammars is considered.

\begin{theorem}
\label{t:dup-eim-space}
The space charged to an attempt
to add a duplicate Earley item to the Earley sets
is \Oc{} if links are included,
zero otherwise.
\end{theorem}

\begin{proof}
The theorem follows from collecting the results
in the complexity discussions of this section.
\end{proof}

\begin{theorem}
\label{t:prediction-time}
No space or time is charged to predicted Earley items,
or to attempts to add predicted Earley items.
\end{theorem}

\begin{proof}
As noted in Section \ref{p:add-eim-set},
the time and space used by predicted Earley items
and attempts to add them is charged elsewhere.
\end{proof}

\chapter{Correctness}
\label{ch:correctness}

We are now in a position to show that Marpa is correct.
\begin{theorem}
\label{t:marpa-is-correct}
\textup{ $\myL{\Marpa,\Cg} = \myL{\Cg}$ }
\end{theorem}

\begin{proof}
We proceed by induction on the Earley sets.
As the basis of the induction,
we note that
Algorithm \ref{alg:top}
at line \ref{line:top-20},
calls Algorithm \ref{alg:initial}.
By Theorem
\ref{t:initial-op-correct},
after
line \ref{line:top-20},
Earley set 0 is correct.

As the step of the induction,
we assume that we
are
at line \ref{line:top-30}
of
Algorithm \ref{alg:top},
about to process
the Earley set at \Vloc{i}.
We assume for the induction step
that
\begin{equation}
\label{eq:marpa-is-correct-20}
\forall \, \Vloc{h} \mid 0 \le \var{h} < \Vloc{i} \implies \text{\Vtable{h} is correct.}
\end{equation}

Line
\ref{line:top-33}
executes the read pass for Earley set \var{i}.
From
\eqref{eq:marpa-is-correct-20}
and Theorem
\ref{t:read-op-correct},
we see that,
after the execution
of line
\ref{line:top-33},
\begin{equation}
\label{eq:marpa-is-correct-40}
\text{the ethereal closure of the read EIM's at \Vloc{i} is correct.}
\end{equation}

Next,
line \ref{line:top-40}
executes the reduction pass for Earley set \var{i}.
From
\eqref{eq:marpa-is-correct-20},
\eqref{eq:marpa-is-correct-40}
and Theorem
\ref{t:reduction-op-correct},
we see that,
after the execution
of line
\ref{line:top-40},
\begin{equation}
\label{eq:marpa-is-correct-50}
\text{the ethereal closure of the reduced EIM's at \Vloc{i} is correct.}
\end{equation}

By assumption for the step,
Earley set \Vloc{i} cannot be Earley set 0,
so we know vacuously that
\begin{equation}
\label{eq:marpa-is-correct-53}
\text{the ethereal closure of start EIM's at \Vloc{i} is correct.}
\end{equation}
From
\eqref{eq:marpa-is-correct-40},
\eqref{eq:marpa-is-correct-50}
and
\eqref{eq:marpa-is-correct-53}
we see that the ethereal closure of
the set of telluric EIM's at \Vloc{i} is correct.
By Theorem
\ref{t:ethereal-closure-op-correct}
we know that the set of ethereal EIM's at \Vloc{i}
is correct.
Since every EIM is either telluric or ethereal,
we know that Earley set \Vloc{i} is correct.
This shows the step of the induction,
and the induction.

We know from the induction
and line \ref{line:top-30}
of Algorithm \ref{alg:top},
that the Earley set at \loc{\Vsize{w}}
is correct.
Therefore,
by Theorem
\ref{t:algorithm-correct},
it contains
the accept EIM if and only if
\Cw{} is in the language of the grammar,
$\var{L}(\Cg)$, so that
\begin{equation}
\label{eq:marpa-is-correct-60}
\Veim{accept} \in \Vtables{Marpa} \equiv \Cw \in \var{L}(\Cg).
\end{equation}

From \eqref{eq:def-implementation-accepts-10},
we know that an algorithm accepts an input if
and only if the accept EIM is in its tables.
By Theorem \ref{t:accept-eim-not-memoized},
we know that the accept EIM is not memoized.
Using
\eqref{eq:def-implementation-accepts-10} and
\eqref{eq:marpa-is-correct-60}, we have
\begin{equation*}
\Cw{} \in \var{L}(\alg{Marpa}, \Cg) \equiv \Cw \in \var{L}(\Cg).
\end{equation*}
\end{proof}

\chapter{Complexity results}
\label{ch:complexity}

\section{Nulling symbols}
\label{s:nulling}

Recall that Marpa grammars,
without loss of generality,
contain neither empty rules nor
properly nullable symbols.
This corresponds directly
to a grammar rewrite in the \Marpa{} implementation,
and its reversal during \Marpa's evaluation phase.
For the correctness and complexity proofs in this monograph,
we assume an additional rewrite,
this time to eliminate nulling symbols.

Elimination of nulling symbols is also
without loss of generality, as can be seen
if we assume that a history
of the rewrite is kept,
and that the rewrite is reversed
after the parse.
Clearly, whether a grammar \Cg{} accepts
an input \Cw{}
will not depend on the nulling symbols in its rules.

In its implementation,
\Marpa{} does not directly rewrite the grammar
to eliminate nulling symbols.
But nulling symbols are ignored in
creating the dotted rules,
and must be restored during \Marpa's evaluation phase,
so that the implementation and
this simplification for theory purposes
track each other closely.

\section{Complexity of each Earley item}

For the complexity proofs,
we consider only Marpa grammars without nulling
symbols.
We showed that this rewrite
is without loss of generality
in Section \ref{s:nulling},
when we examined correctness.
For complexity we must also show that
the rewrite and its reversal can be done
in amortized \Oc{} time and space
per Earley item.

\begin{lemma}
\ltitle{Nulling rewrite}
\label{l:nulling-rewrite}
All time and space required
to rewrite the grammar to eliminate nulling
symbols, and to restore those rules afterwards
in the Earley sets,
can be allocated
to the Earley items
in such a way that each Earley item
requires \Oc{} time and space.
\end{lemma}

\begin{proof}
The time and space used in the rewrite is a constant
that depends on the grammar,
and is charged to the parse.
The reversal of the rewrite can be
done in a loop over the Earley items,
which will have time and space costs
per Earley item,
plus a fixed overhead.
The fixed overhead is \Oc{}
and is charged to the parse.
The time and space per Earley item
is \Oc{}
because the number of
rules into which another rule must be rewritten,
and therefore the number of Earley items
into which another Earley item must be rewritten,
is a constant that depends
on the grammar.
\end{proof}

\begin{theorem}\label{t:O1-time-per-eim}
All time in \Marpa{} can be allocated
to the Earley items,
in such a way that each Earley item,
and each attempt to
add a duplicate Earley item,
requires \Oc{} time.
\end{theorem}

\begin{theorem}\label{t:O1-space-per-eim}
All space in \Marpa{} can be allocated
to the Earley items,
in such a way that each Earley item
requires \Oc{} space and,
if links are not considered,
each attempt to add a duplicate
Earley item adds no additional space.
\end{theorem}

\begin{theorem}\label{t:O1-links-per-eim}
If links are considered,
all space in \Marpa{} can be allocated
to the Earley items
in such a way that each Earley item
and each attempt to
add a duplicate Earley item
requires \Oc{} space.
\end{theorem}

\begin{proof}[Proof of Theorems
\ref{t:O1-time-per-eim},
\ref{t:O1-space-per-eim},
and \ref{t:O1-links-per-eim}]
These theorems follow from the observations
in Section \ref{ch:pseudocode}
and from Lemma \ref{l:nulling-rewrite}.
\end{proof}

The same complexity results apply to \Marpa{} as to \Leo,
and the proofs are very similar.
\Leo's complexity results~\cite{Leo1991}
are based on charging
resources to Earley items,
as were the results
in Earley's paper~\cite{Earley1970}.

Earley~\cite{Earley1970} shows that,
for unambiguous grammars,
every attempt to add
an Earley item will actually add one.
In other words, there will be no attempts to
add duplicate Earley items.
Earley's proof shows that for each attempt
to add a duplicate,
the causation must be different ---
that the EIM's causing the attempt
differ in either their dotted
rules or their origin.
Multiple causations for an Earley item
would mean multiple derivations
for the sentential form that it represents.
That in turn would mean that
the grammar is ambiguous,
contrary to assumption.

As a reminder,
we follow tradition by
stating complexity results in terms of \var{n},
setting $\var{n} = \Vsize{\Cw}$,
where \Vsize{\Cw}
is the length of the input.

\begin{theorem}
\label{t:unambig-reduction-tries}
For an unambiguous grammar,
the number of attempts to add reduction EIM's
will be \On[2].
\end{theorem}

\begin{proof}
Let \Ves{j} be an Earley set for which we
are counting attempts.
\Marpa{} attempts to add an Earley reduction result
to \Ves{j}
once for every pair of matching causes,
\begin{equation}
\label{eq:unambig-reduction-tries-1}
\text{$[\Veim{down}, \Veim{up}]$,
  such that
  $\Current{\Veim{up}} = \Ves{j}$.
}
\end{equation}

Let \var{j-tries} be the number of attempts to
add reduction EIM's to \Ves{j}.
The matching pair in
each of the \var{j-tries} attempts has an effect EIM,
and that effect EIM
either duplicates an EIM already in \Ves{j}
or else adds a new Earley item to \Ves{j}.
The number of Earley items added to \Ves{j}
is at most $\bigsize{\EVtable{\Marpa}{j}} = \order{\var{j}}$
\tref{t:es-count}.
Therefore,
\begin{align}
\label{eq:unambig-reduction-tries-2}
\myparbox{%
the \var{j-tries}
reduction attempts add at most
\order{\var{j}} Earley items
to \Ves{j}, so that
} \\
\label{eq:unambig-reduction-tries-4}
\myparbox{%
either
$\var{j-tries} \le \bigsize{\EVtable{\Marpa}{j}}$,
or an attempted reduction tries to add a duplicate Earley item
\becuz{}
\eqref{eq:unambig-reduction-tries-2}.
}
\intertext{%
We assume for a reductio that
an attempted reduction tries to add a duplicate Earley item,
call it \Veim{eff}.
That is,
}
\label{eq:unambig-reduction-tries-6}
\tag{RAA}
\myparbox{%
two attempts are made to add \Veim{eff}
to \Ves{j};
} \\
\label{eq:unambig-reduction-tries-6b}
\myparbox{%
$\var{pair1} = [\Veim{down1}, \Veim{up1}]$
is the first attempt
\becuz{}
\eqref{eq:unambig-reduction-tries-6}, WLOG;
} \\
\label{eq:unambig-reduction-tries-6d}
\myparbox{%
$\var{pair2} = [\Veim{down2}, \Veim{up2}]$
is the second attempt
\becuz{} \eqref{eq:unambig-reduction-tries-6}, WLOG; and
} \\
\label{eq:unambig-reduction-tries-6f}
\myparbox{%
$\var{pair1} \neq \var{pair2}$
\becuz{} \eqref{eq:unambig-reduction-tries-6}, WLOG.
} \\
\label{eq:unambig-reduction-tries-8}
\myparbox{%
$\Veim{down1} \neq \Veim{down2}$
or
$\Veim{up1} \neq \Veim{up2}$
\becuz{}
\eqref{eq:unambig-reduction-tries-6b},
\eqref{eq:unambig-reduction-tries-6d},
\eqref{eq:unambig-reduction-tries-6f}.
}
\intertext{%
As an aside,
recall that duplicate attempts to add Earley items are ignored,
so that exactly one of the attempts of
\eqref{eq:unambig-reduction-tries-6} will succeed in adding
an Earley item.
}
\label{eq:unambig-reduction-tries-10}
\myparbox{%
$\Veim{down1} \neq \Veim{down2} \implies$
\Cg{} is ambiguous
\becuz{}
\tref{t:multi-down-cause-ambiguous}.
} \\
\label{eq:unambig-reduction-tries-12}
\myparbox{%
$\Veim{up1} \neq \Veim{up2} \implies$
\Cg{} is ambiguous
\becuz{}
\tref{t:multi-up-cause-ambiguous}.
} \\
\label{eq:unambig-reduction-tries-18}
\myparbox{%
\Cg{} is ambiguous
\becuz{}
\eqref{eq:unambig-reduction-tries-8},
\eqref{eq:unambig-reduction-tries-10},
\eqref{eq:unambig-reduction-tries-12}.
} \\
\label{eq:unambig-reduction-tries-20}
\myparbox{%
\Cg{} is not ambiguous, by assumption for the theorem, which
with 
\eqref{eq:unambig-reduction-tries-18} shows the reductio.
} \\
\label{eq:unambig-reduction-tries-22}
\myparbox{%
no reduction attempt tries to
add a duplicate Earley item
to \Ves{j}
\becuz{}
\eqref{eq:unambig-reduction-tries-20},
reductio starting at
\eqref{eq:unambig-reduction-tries-6}.
} \\
\label{eq:unambig-reduction-tries-24}
\myparbox{%
$\var{j-tries} \le \bigsize{\EVtable{\Marpa}{j}}$
\becuz{}
\eqref{eq:unambig-reduction-tries-4},
\eqref{eq:unambig-reduction-tries-22}.
} \\
\label{eq:unambig-reduction-tries-26}
\myparbox{%
$\var{j-tries} = \order{\var{j}}$
\becuz{}
\eqref{eq:unambig-reduction-tries-24},
\tref{t:es-count}.
}
\end{align}

Using
\eqref{eq:unambig-reduction-tries-26},
and summing over the Earley sets from Earley
set 0 to Earley set \var{n},
we see that
\begin{equation}
\label{eq:unambig-reduction-tries-28}
\var{reduction-tries} \le \sum\limits_{\displaystyle \var{j}=0}^{\displaystyle \var{n}} \order{\var{j}}
= \On[2].\qedhere
\end{equation}
\end{proof}

\begin{theorem}
\label{t:start-tries}
In a Marpa grammar,
the number of attempts to add start EIM's
will be \Oc.
\end{theorem}

\begin{proof}
Let
\var{start-tries} be the number of attempts to add the start EIM
to the Earley sets.
It is clear from the pseudocode
that there will be exactly one attempt to add a start EIM
to the Earley sets,
an attempt that will be made in Earley set 0.
Therefore,
\begin{equation}
\label{eq:tries-15}
\var{start-tries} = 1 = \Oc.\qedhere
\end{equation}
\end{proof}

\begin{theorem}
\label{t:read-tries}
In a Marpa grammar,
the number of attempts to add read EIM's
will be \On[2].
\end{theorem}

\begin{proof}
Consider one Earley set, call it \Ves{j}.
Let
\var{read-tries} be the number of attempts to add read EIM's
to the Earley sets.
In the worst case,
when adding Earley items to \Ves{j},
Marpa attempts a read operation
once for every EIM in the Earley set
at \Vdecr{j}.
Therefore, the number of attempts
to add read EIM's to Earley set \Ves{j}
must be less than or equal to \bigsize{\Etable{\Vdecr{j}}}.
\[
\bigsize{\Etable{\Vdecr{j}}} = \order{\Vdecr{j}}
\becuz \tref{t:es-count}.
\]
Summing over the Earley sets from 0 to \var{n},
the number of attempts to add read items will be
\begin{equation*}
\var{read-tries} \le \sum\limits_{i=1}^{n}{ \order{\Vdecr{i}} } = \On[2].\qedhere
\end{equation*}
\end{proof}

\begin{theorem}
\label{t:ethereal-tries}
In a Marpa grammar,
the number of attempts to add ethereal EIM's
will be \On[2].
\end{theorem}

\begin{proof}
From the pseudo-code we see that
ethereal EIM's are only added if their telluric base EIM
is new.
Therefore,
there will never be duplicate attempts
to add ethereal EIM's for the same telluric base EIM.

The ethereal EIM's which might be added for a given
telluric base are predictions and null-scans.
The number of null-scans is limited by the RHS length,
call it \var{rhs-max},
of the longest rule in \Cg{}.
The number of predictions is limited by the number of rules
in \Cg{}, \Vsize{\Crules}.
Therefore,
the number of ethereal add attempts is at most
$\var{rhs-max} + \Vsize{\Crules}$ times the number of EIM's
in the Earley tables:
\begin{align}
\label{eq:ethereal-tries-10}
&
\var{ethereal-tries} \le
\left(
\begin{gathered}
(\var{rhs-max} + \Vsize{\Crules}) \\
\times \sum\limits_{\var{i}=1}^{\var{n}}{ \bigsize{\Etable{\var{i}}} }
\end{gathered}
\right).
\\
\label{eq:ethereal-tries-12}
& \text{%
\var{rhs-max} and
\Vsize{\Crules} are constants that depend on \Cg{}.
} \\
\label{eq:ethereal-tries-14}
& \var{ethereal-tries} = \Oc \times 
\sum\limits_{\var{i}=1}^{\var{n}}{ \bigsize{\Etable{\var{i}}} }
\becuz
\eqref{eq:ethereal-tries-10},
\eqref{eq:ethereal-tries-12}.
\\
\label{eq:ethereal-tries-16}
& \var{ethereal-tries} = \Oc \times 
\sum\limits_{\var{i}=1}^{\var{n}}{ \order{\var{i}} }
\becuz
\eqref{eq:ethereal-tries-14},
\tref{t:es-count}.
\\
\notag
& \var{ethereal-tries} = \On[2]
\becuz
\eqref{eq:ethereal-tries-16}.
\qedhere
\end{align}
\end{proof}

\begin{theorem}
\label{t:leo-tries}
In a Marpa grammar,
the number of attempts to add Leo memos
will be \On[2].
\end{theorem}

\begin{proof}
For Leo reduction,
we note that by its definition,
duplicate attempts at Leo reduction cannot occur.
From the pseudo-code of Sections \ref{p:reduce-one-up-cause}
and \ref{p:leo-op},
we know there will be at most one Leo reduction for
every Earley item in the Earley tables:
\begin{align}
\label{eq:leo-tries-10}
& \var{leo-tries} \le
\sum\limits_{\var{i}=1}^{\var{n}}{
\bigsize{\Etable{\var{i}}}
}.
\\
\label{eq:leo-tries-12}
& \forall \; \var{i} : \bigsize{\Etable{\var{i}}} = \order{\var{i}}
\becuz \tref{t:es-count}.
\\
\notag
& \var{leo-tries} =
\sum\limits_{\var{i}=1}^{\var{n}}{
\order{\var{i}}
} = \On[2] \becuz
\eqref{eq:leo-tries-10},
\eqref{eq:leo-tries-12}
.\qedhere
\end{align}
\end{proof}

\begin{theorem}
\label{t:tries}
In an unambiguous Marpa grammar,
the number of attempts to add
Leo memos and Earley items will be
\[\var{tries} = \On[2].\]
\end{theorem}

\begin{proof}
For the purpose of this proof,
we call each attempt to add a Leo memo or an Earley item,
a ``try''.
We proceed by cases, and we classify tries as follows:
\begin{itemize}
\item
EIM tries
\begin{itemize}
\item
Telluric tries
\begin{itemize}
\item
Start tries: \Oc{} \becuz{} \tref{t:start-tries}.
\item
Read tries: \On[2] \becuz{} \tref{t:read-tries}.
\item
Reduction tries: \On[2] \becuz{} \tref{t:unambig-reduction-tries}.
\end{itemize}
\item
Ethereal tries: \On[2] \becuz{} \tref{t:ethereal-tries}.
\end{itemize}
\item
Leo tries: \On[2] \becuz{} \tref{t:leo-tries}.
\end{itemize}

Summing the above,
\begin{align*}
\label{eq:tries-5}
\var{tries} & = \Oc + \On[2] + \On[2] + \On[2] + \On[2] \\*
    & = \On[2] \qedhere
\end{align*}
\end{proof}

\begin{theorem}
\label{t:leo-right-recursion}
Either
a right derivation has a step
that uses a right recursive rule,
or its length is at most \var{c},
where \var{c} is a constant which depends
on the grammar.
\end{theorem}

\begin{proof}
Let the constant \var{c} be the number
of symbols.
Assume, for a reductio, that a right derivation
expands to a
Leo sequence of length
$\var{c}+1$, but that none of its steps uses a right recursive rule.

Because it is of length $\var{c}+1$,
the same symbol must appear twice as the rightmost symbol of
a derivation step.
(Since for the purposes of these
complexity results we ignore nulling symbols,
the rightmost symbol of a string will also be its rightmost
telluric symbol.)
So part of the rightmost derivation must take the form
\begin{equation*}
\Vstr{earlier-prefix} \cat \Vsym{A} \deplus \Vstr{later-prefix} \cat \Vsym{A}.
\end{equation*}
But the first step of this derivation sequence must use a rule of the
form
\begin{equation*}
\Vsym{A} \de \Vstr{rhs-prefix} \cat \Vsym{rightmost},
\end{equation*}
where $\Vsym{rightmost} \deplus \Vsym{A}$.
Such a rule is right recursive by definition.
This is contrary to the assumption for the reductio.
We therefore conclude that the length of a right derivation
must be less than or equal to \var{c},
unless at least one step of that derivation uses a right recursive rule.
\end{proof}

TODO: Account for effect of not-memoizing at location 0.

\begin{theorem}
For every LR-regular grammar,
\Marpa{} runs in $\On{}$ time and space.
\end{theorem}

\begin{proof}
By Theorem 4.6 in~\cite[p. 173]{Leo1991},
the number of Earley items produced by
\Leo{} when parsing input \Cw{} with an LR-regular grammar \Cg{} is
\begin{equation*}
\order{\Vsize{\Cw}} = \order{\var{n}}.
\end{equation*}
\Marpa{} may produce more Earley items than \Leo{}
because
\Marpa{} does not apply Leo memoization to Leo sequences
which do not contain right recursion.

By the definition of an EIM,
and the construction of a Leo sequence,
it can be seen that a Leo sequence
corresponds step-for-step with a
right derivation.
It can therefore be seen that
the number of EIM's in the Leo sequence
and the number of right derivation steps
in its corresponding right derivation
will be the same.

Consider one EIM that is memoized in \Leo{}.
If not memoized because it is not a right recursion,
this EIM will be expanded to a sequence
of EIM's.
How long will this sequence of non-memoized EIM's
be, if we still continue to memoize EIM's
which correspond to right recursive rules?
The EIM sequence, which was formerly a memoized Leo sequence,
will correspond to a right
derivation that does not include
any steps that use right recursive rules.
By Theorem \ref{t:leo-right-recursion},
such a
right derivation can be
of length at most \var{c1},
where \var{c1} is a constant that depends on \Cg{}.
As noted, this right derivation has
the same length as its corresponding EIM sequence,
so that each EIM not memoized in \Marpa{} will expand
to at most \var{c1} EIM's.

The number of EIM's per Earley set
for an LR-regular grammar in a \Marpa{} parse
is less than
\begin{equation*}
    \var{c1} \times \order{\var{n}} = \order{\var{n}}.
\end{equation*}

LR-regular grammars are unambiguous, so that
by Theorem \ref{t:tries},
the number of attempts that \Marpa{} will make to add
EIM's is less than or equal to
\var{c2} times the number of EIM's,
where \var{c2} is a constant that depends on \Cg{}.
Therefore,
by Theorems \ref{t:O1-time-per-eim}
and \ref{t:O1-links-per-eim},
the time and space complexity of \Marpa{} for LR-regular
grammars is
\begin{equation*}
    \var{c2} \times \order{\var{n}}
    = \order{\var{n}}.\qedhere
\end{equation*}
\end{proof}

\begin{theorem}
\label{t:eim-count}
For a context-free grammar,
\begin{equation*}
\textup{
    $\Rtablesize{\Marpa} = \order{\var{n}^2}$.
}
\end{equation*}
\end{theorem}

\begin{proof}
By Theorem \ref{t:es-count},
the size of the Earley set at \Vloc{i}
is $\order{\var{i}}$.
Summing over the length of the input,
$\Vsize{\Cw} = \var{n}$,
the number of EIM's in all of \Marpa's Earley sets
is
\begin{equation*}
\sum\limits_{\Vloc{i}=0}^{\var{n}}{\order{\var{i}}}
= \order{\var{n}^2}.\qedhere
\end{equation*}
\end{proof}

\begin{theorem}
\label{t:reduction-tries}
For a Marpa grammar,
the number of attempts to add reduction EIM's
will be \On[3].
\end{theorem}

\begin{proof}
Let \var{tries} be the number of attempts to add reduction EIM's to
the Earley tables.
Let \var{pairs} be the set of matching causes in the Earley tables.
\Marpa{} attempts to add an Earley reduction result
to the Earley tables
once for every pair of matching causes,
that is, once for every
\begin{equation}
\label{eq:reduction-tries-10}
[\Veim{down}, \Veim{up}] \in \var{pairs}.
\end{equation}
Therefore, if \bigsize{\var{pairs}} is the number of matching cause pairs
in the Earley tables,
then
\[
\bigsize{\var{pairs}} = \var{tries}.
\]

Recall that the first element of each pair of matching causes
is its top-down cause,
and the second element of each pair is its bottom-up cause.
For brevity, we will call the top-down cause of a matching pair
of causes, its ``top-down cause'',
and we will call the bottom-up cause of a matching pair of
causes, its ``bottom-up cause''.
We can see that
\begin{equation}
\label{eq:reduction-tries-15}
    \bigsize{\var{pairs}} \le \var{up-count} \times \var{downs-per-up},
\end{equation}
where
\var{up-count} is the number of EIM's which are
bottom-up causes,
and \var{downs-per-up} is the maximum number of 
top-down causes for any bottom-up cause, that is
\[
   \var{downs-per-up} =
   \max_{\Veim{up}} \left|
     \begin{gathered}
     \Veim{down} \; \text{such that} \\
     [\Veim{down}, \Veim{up}] \\
     \in \var{pairs}
     \end{gathered}
   \right|.
\]

We first seek an upper bound for \var{downs-per-up}.
We know that
\begin{align}
\label{eq:reduction-tries-25}
&
\begin{gathered}
\forall \; \Veim{down}, \Veim{up} :
[\Veim{down}, \Veim{up}] \in \var{pairs}
\\
\implies
\Right{\Veim{down}} = \Left{\Veim{up}}
\\
\becuz \dref[matching causes]{def:matching-causes}.
\end{gathered}
\intertext{%
Let \var{ups} be the set of bottom-up causes in \var{pairs}.
Because every top-down cause must be in 
the Earley set which is the origin of its bottom-up cause,
we see that
}
\label{eq:reduction-tries-27}
&
\var{downs-per-up} = \max_{\Veim{up} \in \var{ups}}
  \; \bigsize{\Etable{\Left{\Veim{up}}}}
\becuz \eqref{eq:reduction-tries-25}.
\\
\label{eq:reduction-tries-29}
&
\var{downs-per-up} = \max_{\Veim{up} \in \var{ups}}
  \; \order{\Left{\Veim{up}}}
\becuz{} \eqref{eq:reduction-tries-27}.
\\
\label{eq:reduction-tries-31}
& \myparbox{
$\forall \; \Veim{up} :
  (\Veim{up} \in \var{ups}) \implies
  \Left{\Veim{up}} \le \var{n}$,
because every location in the Earley tables
must be less than or equal to
$\Vsize{\Cw} = \var{n}$
\tref{t:es-count}.
}
\intertext{%
We are now in a position to state an
upper bound for \var{downs-per-up}:
}
\label{eq:reduction-tries-33}
&
\var{downs-per-up} = \On[]
\becuz \eqref{eq:reduction-tries-29},
\eqref{eq:reduction-tries-31}.
\intertext{%
As an upper bound, we allow
every EIM to be a bottom-up cause so that
}
\label{eq:reduction-tries-35}
& \var{up-count} =
\sum\limits_{\var{i}=1}^{\var{n}}{
\bigsize{\Etable{\var{i}}}
}.
\\
\label{eq:reduction-tries-37}
& \forall \; \var{i} : \bigsize{\Etable{\var{i}}} = \order{\var{i}}
\becuz \tref{t:es-count}.
\\
\label{eq:reduction-tries-39}
& \var{up-count} =
\sum\limits_{\var{i}=1}^{\var{n}}{
\order{\var{i}}
} = \On[2] \becuz
\eqref{eq:reduction-tries-35},
\eqref{eq:reduction-tries-37}.
\\
\notag
& \bigsize{\var{pairs}} = \On[3]
\becuz
\eqref{eq:reduction-tries-15},
\eqref{eq:reduction-tries-33},
\eqref{eq:reduction-tries-39}
.\qedhere
\end{align}
\end{proof}

\begin{theorem}
\label{t:ambiguous-tries}
For a context-free grammar,
the number of attempts by \Marpa{} to add
Earley items is \On[3].
\end{theorem}

\begin{proof}
For the purpose of this proof,
we call each attempt to add a Leo memo or an Earley item,
a ``try''.
We proceed by cases, and we classify tries as follows:
\begin{itemize}
\item
EIM tries
\begin{itemize}
\item
Telluric tries
\begin{itemize}
\item
Start tries: \Oc{} \becuz{} \tref{t:start-tries}.
\item
Read tries: \On[2] \becuz{} \tref{t:read-tries}.
\item
Reduction tries: \On[3] \becuz{} \tref{t:reduction-tries}.
\end{itemize}
\item
Ethereal tries: \On[2] \becuz{} \tref{t:ethereal-tries}.
\end{itemize}
\item
Leo tries: \On[2] \becuz{} \tref{t:leo-tries}.
\end{itemize}

Summing the above,
\begin{align*}
\label{eq:ambiguous-tries-5}
\var{tries} & = \Oc + \On[2] + \On[3] + \On[2] + \On[2] \\*
    & = \On[3] \qedhere
\end{align*}

TODO: finish
\end{proof}

\begin{theorem}
For every unambiguous grammar,
\Marpa{} runs in $\order{\var{n}^2}$ time and space.
\end{theorem}

\begin{proof}
By assumption, \Cg{} is unambiguous, so that
by Theorem \ref{t:tries},
and Theorem \ref{t:eim-count},
the number of attempts that \Marpa{} will make to add
EIM's is
\begin{equation*}
\var{c} \times \order{\var{n}^2},
\end{equation*}
where \var{c} is a constant that depends on \Cg{}.
Therefore,
by Theorems \ref{t:O1-time-per-eim}
and \ref{t:O1-links-per-eim},
the time and space complexity of \Marpa{}
for unambiguous grammars is \order{\var{n}^2}.
\end{proof}

\begin{FlushLeft}
\begin{theorem}
For every context-free grammar,
\Marpa{} runs in $\order{\var{n}^3}$ time.
\end{theorem}
\end{FlushLeft}

\begin{proof}
By Theorem \ref{t:O1-time-per-eim},
and Theorem \ref{t:ambiguous-tries}.
\end{proof}

\begin{FlushLeft}
\begin{theorem}\label{t:cfg-space}
For every context-free grammar,
\Marpa{} runs in $\order{\var{n}^2}$ space,
if it does not track links.
\end{theorem}
\end{FlushLeft}

\begin{proof}
By Theorem \ref{t:O1-space-per-eim}
and Theorem \ref{t:eim-count}.
\end{proof}

Traditionally, the only space result stated for a parsing algorithm
is that
without links, as in Theorem \ref{t:cfg-space}.
This is sufficiently relevant
if the parser is only used as a recognizer.
In practice, however,
algorithms like \Marpa{}
are typically used in anticipation
of an evaluation phase,
for which links are necessary.

\begin{FlushLeft}
\begin{theorem}
For every context-free grammar,
\Marpa{} runs in $\order{\var{n}^3}$ space,
including the space for tracking links.
\end{theorem}
\end{FlushLeft}

\begin{proof}
By Theorem \ref{t:O1-links-per-eim},
and Theorem \ref{t:ambiguous-tries}.
\end{proof}

\chapter{Acknowledgements}
\label{ch:Acknowledgements}

Ruslan Shvedov%
\index{recce-general}{Shvedov, Ruslan}
and
Ruslan Zakirov%
\index{recce-general}{Zakirov, Ruslan}
made many useful suggestions
that are incorporated in this paper.
Many members of the Marpa community
have helped me in many ways,
and it is risky
to single out one of them.
But Ron Savage%
\index{recce-general}{Savage, Ron}
has been unstinting in
his support.

\bibliographystyle{plain}

\begin{thebibliography}{10}
\RaggedRight

\bibitem{AU1972}
Alfred H.~Aho and Jeffrey D.~Ullman.
\newblock The Theory of Parsing, Translation, and Compiling.
\newblock Prentice-Hall, Englewood Cliffs, N.J., 1972.

\bibitem{AH2002}
John~Aycock and R.~Nigel~Horspool.
\newblock Practical Earley Parsing
\newblock {\em The Computer Journal},
    Vol. 45, No. 6, 2002, pp. 620--630.

\bibitem{Culik1973}
{\v{C}}ulik, Karel and Cohen, Rina.
\newblock LR-Regular grammars---an extension of LR (k) grammars.
\newblock {\em Journal of Computer and System Sciences},
  Vol. 7, No. 1, 1973,
  pp. 66--96.

\bibitem{Earley1968}
J.~Earley.
\newblock An Efficient Context-Free Parsing Algorithm.
\newblock Ph.D. Thesis, Carnegie Mellon University, 1968

\bibitem{Earley1970}
J.~Earley.
\newblock An efficient context-free parsing algorithm.
\newblock {\em Communications of the Association for Computing Machinery},
  13(2):94--102, 1970.

\bibitem{GJ2008}
Dirk~Grune and Ceriel~J.~H.~Jacobs.
\newblock {\em Parsing Techniques: A Practical Guide}.
\newblock Springer, Amsterdam, 2008.

\bibitem{ED1976}
Dijkstra,~Edsger~W.
\newblock {\em A discipline of programming}.
\newblock Prentice-Hall, Englewood Cliffs, N.J., 1976.

\bibitem{Irons}
Edgar~T.~Irons.
\newblock A syntax-directed compiler for ALGOL 60.
\newblock {\em Communications of the Association for Computing Machinery},
 4(1):51--55, Jan. 1961

\bibitem{Johnson}
Stephen~C. Johnson.
\newblock Yacc: Yet another compiler-compiler.
\newblock In {\em Unix Programmer's Manual Supplementary Documents 1}. 1986.

\bibitem{Marpa-2013}
Jeffrey~Kegler.
\newblock Marpa, a practical general parser: the recognizer.
\newblock \url{https://www.academia.edu/10341474/Marpa_A_practical_general_parser_the_recognizer}.

\bibitem{Marpa-R2}
Jeffrey~Kegler, 2015: Marpa-R2.
\newblock \url{http://search.cpan.org/dist/Marpa-R2/}.

\bibitem{Leo1991}
J.~M. I.~M. Leo.
\newblock A general context-free parsing algorithm running in linear time on
  every {LR($k$)} grammar without using lookahead.
\newblock {\em Theoretical Computer Science}, 82:165--176, 1991.

\bibitem{Wich2005}
Klaus Wich.
\newblock Ambiguity functions of context-free grammars and languages.
\newblock Ph.D. Thesis, Universit{\"a}t Stuttgart, 2005.
\newblock \url{http://elib.uni-stuttgart.de/opus/volltexte/2005/2282}

\end{thebibliography}

\clearpage
% \def\indexname{List of definitions, theorems and lemmas}
% uses .mst file
\printindex{recce-theorems}

\clearpage
% \def\indexname{List of algorithms}
% uses .mst file
\printindex{recce-algorithms}

% Merged into algorithms list
% \clearpage
% \def\indexname{Index of figures}
% \printindex{recce-figures}

\clearpage
% \def\indexname{Index of abbreviations and definitions}
% uses .mst file
\printindex{recce-definitions}

\clearpage
\def\indexname{Index of notation}
\printindex{recce-notation}

\clearpage
\def\indexname{General index}
\printindex{recce-general}

\tableofcontents

\end{document}