diff --git a/thys/Inductive_Inference/CONS_LIM.thy b/thys/Inductive_Inference/CONS_LIM.thy new file mode 100644 --- /dev/null +++ b/thys/Inductive_Inference/CONS_LIM.thy @@ -0,0 +1,544 @@ +section \CONS is a proper subset of LIM\label{s:cons_lim}\ + +theory CONS_LIM + imports Inductive_Inference_Basics +begin + +text \That there are classes in @{term "LIM - CONS"} was noted by +Barzdin~\cite{b-iiafp-74,b-iiafp-77} and Blum and Blum~\cite{bb-tmtii-75}. It +was proven by Wiehagen~\cite{w-lerfss-76} (see also Wiehagen and +Zeugmann~\cite{wz-idmowle-94}). The proof uses this class:\ + +definition U_LIMCONS :: "partial1 set" ("U\<^bsub>LIM-CONS\<^esub>") where + "U\<^bsub>LIM-CONS\<^esub> \ {vs @ [j] \ p| vs j p. j \ 2 \ p \ \\<^sub>0\<^sub>1 \ \ j = vs @ [j] \ p}" + +text \Every function in @{term "U\<^bsub>LIM-CONS\<^esub>"} carries a Gödel number +greater or equal two of itself, after which only zeros and ones occur. +Thus, a strategy that always outputs the rightmost value greater or equal two +in the given prefix will converge to this Gödel number. + +The next function searches an encoded list for the rightmost element +greater or equal two.\ + +definition rmge2 :: partial1 where + "rmge2 e \ + if \i e_nth e i \ 2))" + +lemma rmge2: + assumes "xs = list_decode e" + shows "rmge2 e = + (if \i xs ! i \ 2)))" +proof - + have "(i < e_length e \ e_nth e i \ 2) = (i < length xs \ xs ! i \ 2)" for i + using assms by simp + then have "(GREATEST i. i < e_length e \ e_nth e i \ 2) = + (GREATEST i. i < length xs \ xs ! i \ 2)" + by simp + moreover have "(\ii xs ! i \ 2) < length xs" (is "Greatest ?P < _") + if "\ (\i n) = + (if \i the (f i) \ 2))))" +proof - + let ?xs = "prefix f n" + have "f \ n = list_encode ?xs" by (simp add: init_def) + moreover have "(\ii the (f i) \ 2) = + (GREATEST i. i < length ?xs \ ?xs ! i \ 2)" + using length_prefix[of f n] prefix_nth[of _ n f] by metis + moreover have "(GREATEST i. i < Suc n \ the (f i) \ 2) < Suc n" + if "\ (\ii. i the (f i) \ 2" n] by fastforce + ultimately show ?thesis using rmge2 by auto +qed + +corollary rmge2_init_total: + assumes "total1 f" + shows "rmge2 (f \ n) = + (if \i the (f i) \ 2))" + using assms total1_def rmge2_init by auto + +lemma rmge2_in_R1: "rmge2 \ \" +proof - + define g where + "g = Cn 3 r_ifle [r_constn 2 2, Cn 3 r_nth [Id 3 2, Id 3 0], Cn 3 r_nth [Id 3 2, Id 3 0], Id 3 1]" + then have "recfn 3 g" by simp + then have g: "eval g [j, r, e] \= (if 2 \ e_nth e j then e_nth e j else r)" for j r e + using g_def by simp + + let ?h = "Pr 1 Z g" + have "recfn 2 ?h" + by (simp add: \recfn 3 g\) + have h: "eval ?h [j, e] = + (if \i e_nth e i \ 2)))" for j e + proof (induction j) + case 0 + then show ?case using \recfn 2 ?h\ by auto + next + case (Suc j) + then have "eval ?h [Suc j, e] = eval g [j, the (eval ?h [j, e]), e]" + using \recfn 2 ?h\ by auto + then have *: "eval ?h [Suc j, e] \= + (if 2 \ e_nth e j then e_nth e j + else if \i e_nth e i \ 2)))" + using g Suc by auto + show ?case + proof (cases "\i e_nth e j") + case True + then have "eval ?h [Suc j, e] \= e_nth e j" + using * by simp + moreover have "(GREATEST i. i < Suc j \ e_nth e i \ 2) = j" + using ex True Greatest_equality[of "\i. i < Suc j \ e_nth e i \ 2"] + by simp + ultimately show ?thesis using ex by auto + next + case False + then have "\i 2" + using ex leI less_Suc_eq by blast + with * have "eval ?h [Suc j, e] \= e_nth e (GREATEST i. i < j \ e_nth e i \ 2)" + using False by (smt leD) + moreover have "(GREATEST i. i < Suc j \ e_nth e i \ 2) = + (GREATEST i. 
i < j \ e_nth e i \ 2)" + using False ex by (metis less_SucI less_Suc_eq less_antisym numeral_2_eq_2) + ultimately show ?thesis using ex by metis + qed + qed + qed + + let ?hh = "Cn 1 ?h [Cn 1 r_length [Id 1 0], Id 1 0]" + have "recfn 1 ?hh" + using `recfn 2 ?h` by simp + with h have hh: "eval ?hh [e] \= + (if \i e_nth e i \ 2))" for e + by auto + then have "eval ?hh [e] = rmge2 e" for e + unfolding rmge2_def by auto + moreover have "total ?hh" + using hh totalI1 `recfn 1 ?hh` by simp + ultimately show ?thesis using `recfn 1 ?hh` by blast +qed + +text \The first part of the main result is that @{term "U\<^bsub>LIM-CONS\<^esub> \ LIM"}.\ + +lemma U_LIMCONS_in_Lim: "U\<^bsub>LIM-CONS\<^esub> \ LIM" +proof - + have "U\<^bsub>LIM-CONS\<^esub> \ \" + unfolding U_LIMCONS_def using prepend_in_R1 RPred1_subseteq_R1 by blast + have "learn_lim \ U\<^bsub>LIM-CONS\<^esub> rmge2" + proof (rule learn_limI) + show "environment \ U\<^bsub>LIM-CONS\<^esub> rmge2" + using \U_LIMCONS \ \\ phi_in_P2 rmge2_def rmge2_in_R1 by simp + show "\i. \ i = f \ (\\<^sup>\n. rmge2 (f \ n) \= i)" if "f \ U\<^bsub>LIM-CONS\<^esub>" for f + proof - + from that obtain vs j p where + j: "j \ 2" + and p: "p \ \\<^sub>0\<^sub>1" + and s: "\ j = vs @ [j] \ p" + and f: "f = vs @ [j] \ p" + unfolding U_LIMCONS_def by auto + then have "\ j = f" by simp + from that have "total1 f" + using `U\<^bsub>LIM-CONS\<^esub> \ \` R1_imp_total1 total1_def by auto + define n\<^sub>0 where "n\<^sub>0 = length vs" + have f_gr_n0: "f n \= 0 \ f n \= 1" if "n > n\<^sub>0" for n + proof - + have "f n = p (n - n\<^sub>0 - 1)" + using that n\<^sub>0_def f by simp + with RPred1_def p show ?thesis by auto + qed + have "rmge2 (f \ n) \= j" if "n \ n\<^sub>0" for n + proof - + have n0_greatest: "(GREATEST i. i < Suc n \ the (f i) \ 2) = n\<^sub>0" + proof (rule Greatest_equality) + show "n\<^sub>0 < Suc n \ the (f n\<^sub>0) \ 2" + using n\<^sub>0_def f that j by simp + show "\y. y < Suc n \ the (f y) \ 2 \ y \ n\<^sub>0" + proof - + fix y assume "y < Suc n \ 2 \ the (f y)" + moreover have "p \ \ \ (\n. p n \= 0 \ p n \= 1)" + using RPred1_def p by blast + ultimately show "y \ n\<^sub>0" + using f_gr_n0 + by (metis Suc_1 Suc_n_not_le_n Zero_neq_Suc le_less_linear le_zero_eq option.sel) + qed + qed + have "f n\<^sub>0 \= j" + using n\<^sub>0_def f by simp + then have "\ (\i n) = f (GREATEST i. i < Suc n \ the (f i) \ 2)" + using rmge2_init_total `total1 f` by auto + with n0_greatest `f n\<^sub>0 \= j` show ?thesis by simp + qed + with `\ j = f` show ?thesis by auto + qed + qed + then show ?thesis using Lim_def by auto +qed + +text \The class @{term "U_LIMCONS"} is \emph{prefix-complete}, which +means that every non-empty list is the prefix of some function in @{term +"U_LIMCONS"}. To show this we use an auxiliary lemma: For every $f \in +\mathcal{R}$ and $k \in \mathbb{N}$ the value of $f$ at $k$ can be replaced +by a Gödel number of the function resulting from the replacement.\ + +lemma goedel_at: + fixes m :: nat and k :: nat + assumes "f \ \" + shows "\n\m. \ n = (\x. if x = k then Some n else f x)" +proof - + define psi :: "partial1 \ nat \ partial2" where + "psi = (\f k i x. 
(if x = k then Some i else f x))" + have "psi f k \ \\<^sup>2" + proof - + obtain r where r: "recfn 1 r" "total r" "eval r [x] = f x" for x + using assms by auto + define r_psi where + "r_psi = Cn 2 r_ifeq [Id 2 1, r_dummy 1 (r_const k), Id 2 0, Cn 2 r [Id 2 1]]" + show ?thesis + proof (rule R2I[of r_psi]) + from r_psi_def show "recfn 2 r_psi" + using r(1) by simp + have "eval r_psi [i, x] = (if x = k then Some i else f x)" for i x + proof - + have "eval (Cn 2 r [Id 2 1]) [i, x] = f x" + using r by simp + then have "eval r_psi [i, x] = eval r_ifeq [x, k, i, the (f x)]" + unfolding r_psi_def using \recfn 2 r_psi\ r R1_imp_total1[OF assms] + by simp + then show ?thesis using assms by simp + qed + then show "\x y. eval r_psi [x, y] = psi f k x y" + unfolding psi_def by simp + then show "total r_psi" + using totalI2[of r_psi] \recfn 2 r_psi\ assms psi_def by fastforce + qed + qed + then obtain n where "n \ m" "\ n = psi f k n" + using assms kleene_fixed_point[of "psi f k" m] by auto + then show ?thesis unfolding psi_def by auto +qed + +lemma U_LIMCONS_prefix_complete: + assumes "length vs > 0" + shows "\f\U\<^bsub>LIM-CONS\<^esub>. prefix f (length vs - 1) = vs" +proof - + let ?p = "\_. Some 0" + let ?f = "vs @ [0] \ ?p" + have "?f \ \" + using prepend_in_R1 RPred1_subseteq_R1 const0_in_RPred1 by blast + with goedel_at[of ?f 2 "length vs"] obtain j where + j: "j \ 2" "\ j = (\x. if x = length vs then Some j else ?f x)" (is "_ = ?g") + by auto + moreover have g: "?g x = (vs @ [j] \ ?p) x" for x + by (simp add: nth_append) + ultimately have "?g \ U\<^bsub>LIM-CONS\<^esub>" + unfolding U_LIMCONS_def using const0_in_RPred1 by fastforce + moreover have "prefix ?g (length vs - 1) = vs" + using g assms prefixI prepend_associative by auto + ultimately show ?thesis by auto +qed + +text \Roughly speaking, a strategy learning a prefix-complete class +must be total because it must be defined for every prefix in +the class. Technically, however, the empty list is not a prefix, and thus a +strategy may diverge on input 0. We can work around this by +showing that if there is a strategy learning a prefix-complete class then +there is also a total strategy learning this class. We need the result only +for consistent learning.\ + +lemma U_prefix_complete_imp_total_strategy: + assumes "\vs. length vs > 0 \ \f\U. prefix f (length vs - 1) = vs" + and "learn_cons \ U s" + shows "\t. total1 t \ learn_cons \ U t" +proof - + define t where "t = (\e. if e = 0 then Some 0 else s e)" + have "s e \" if "e > 0" for e + proof - + from that have "list_decode e \ []" (is "?vs \ _") + using list_encode_0 list_encode_decode by (metis less_imp_neq) + then have "length ?vs > 0" by simp + with assms(1) obtain f where f: "f \ U" "prefix f (length ?vs - 1) = ?vs" + by auto + with learn_cons_def learn_limE have "s (f \ (length ?vs - 1)) \" + using assms(2) by auto + then show "s e \" + using f(2) init_def by auto + qed + then have "total1 t" + using t_def by auto + have "t \ \

" + proof - + from assms(2) have "s \ \

" + using learn_consE by simp + then obtain rs where rs: "recfn 1 rs" "eval rs [x] = s x" for x + by auto + define rt where "rt = Cn 1 (r_lifz Z rs) [Id 1 0, Id 1 0]" + then have "recfn 1 rt" + using rs by auto + moreover have "eval rt [x] = t x" for x + using rs rt_def t_def by simp + ultimately show ?thesis by blast + qed + have "s (f \ n) = t (f \ n)" if "f \ U" for f n + unfolding t_def by (simp add: init_neq_zero) + then have "learn_cons \ U t" + using `t \ \

` assms(2) learn_consE[of \ U s] learn_consI[of \ U t] by simp + with `total1 t` show ?thesis by auto +qed + +text \The proof of @{prop "U\<^bsub>LIM-CONS\<^esub> \ CONS"} is by contradiction. +Assume there is a consistent learning strategy $S$. By the previous +lemma $S$ can be assumed to be total. Moreover it outputs a consistent +hypothesis for every prefix. Thus for every $e \in \mathbb{N}^+$, $S(e) \neq +S(e0)$ or $S(e) \neq S(e1)$ because $S(e)$ cannot be consistent with both +$e0$ and $e1$. We use this property of $S$ to construct a function in @{term +"U\<^bsub>LIM-CONS\<^esub>"} for which $S$ fails as a learning strategy. To +this end we define a numbering $\psi \in \mathcal{R}^2$ with $\psi_i(0) = i$ +and +\[ +\psi_i(x + 1) = \left\{\begin{array}{ll} + 0 & \mbox{if } S(\psi_i^x0) \neq S(\psi_i^x),\\ + 1 & \mbox{otherwise}. +\end{array}\right. +\] +This numbering is recursive because $S$ is total. The ``otherwise'' case is +equivalent to $S(\psi_i^x1) \neq S(\psi_i^x)$ because $S(\psi_i^x)$ cannot be +consistent with both $\psi_i^x0$ and $\psi_i^x1$. Therefore every prefix +$\psi_i^x$ is extended in such a way that $S$ changes its hypothesis. Hence +$S$ does not learn $\psi_i$ in the limit. Kleene's fixed-point theorem +ensures that for some $j \geq 2$, $\varphi_j = \psi_j$. This $\psi_j$ is the +sought function in @{term "U\<^bsub>LIM-CONS\<^esub>"}. + +The following locale formalizes the construction of $\psi$ for a total +strategy $S$.\ + +locale cons_lim = + fixes s :: partial1 + assumes s_in_R1: "s \ \" +begin + +text \A @{typ recf} computing the strategy:\ + +definition r_s :: recf where + "r_s \ SOME r_s. recfn 1 r_s \ total r_s \ s = (\x. eval r_s [x])" + +lemma r_s_recfn [simp]: "recfn 1 r_s" + and r_s_total [simp]: "\x. eval r_s [x] \" + and eval_r_s: "s = (\x. 
eval r_s [x])" + using r_s_def R1_SOME[OF s_in_R1, of r_s] by simp_all + +text \The next function represents the prefixes of $\psi_i$.\ + +fun prefixes :: "nat \ nat \ nat list" where + "prefixes i 0 = [i]" +| "prefixes i (Suc x) = (prefixes i x) @ + [if s (e_snoc (list_encode (prefixes i x)) 0) = s (list_encode (prefixes i x)) + then 1 else 0]" + +definition "r_prefixes_aux \ + Cn 3 r_ifeq + [Cn 3 r_s [Cn 3 r_snoc [Id 3 1, r_constn 2 0]], + Cn 3 r_s [Id 3 1], + Cn 3 r_snoc [Id 3 1, r_constn 2 1], + Cn 3 r_snoc [Id 3 1, r_constn 2 0]]" + +lemma r_prefixes_aux_recfn: "recfn 3 r_prefixes_aux" + unfolding r_prefixes_aux_def by simp + +lemma r_prefixes_aux: + "eval r_prefixes_aux [j, v, i] \= + e_snoc v (if eval r_s [e_snoc v 0] = eval r_s [v] then 1 else 0)" + unfolding r_prefixes_aux_def by auto + +definition "r_prefixes \ r_swap (Pr 1 r_singleton_encode r_prefixes_aux)" + +lemma r_prefixes_recfn: "recfn 2 r_prefixes" + unfolding r_prefixes_def r_prefixes_aux_def by simp + +lemma r_prefixes: "eval r_prefixes [i, n] \= list_encode (prefixes i n)" +proof - + let ?h = "Pr 1 r_singleton_encode r_prefixes_aux" + have "eval ?h [n, i] \= list_encode (prefixes i n)" + proof (induction n) + case 0 + then show ?case + using r_prefixes_def r_prefixes_aux_recfn r_singleton_encode by simp + next + case (Suc n) + then show ?case + using r_prefixes_aux_recfn r_prefixes_aux eval_r_s + by auto metis+ + qed + moreover have "eval ?h [n, i] = eval r_prefixes [i, n]" for i n + unfolding r_prefixes_def by (simp add: r_prefixes_aux_recfn) + ultimately show ?thesis by simp +qed + +lemma prefixes_neq_nil: "length (prefixes i x) > 0" + by (induction x) auto + +text \The actual numbering can then be defined via @{term prefixes}.\ + +definition psi :: "partial2" ("\") where + "\ i x \ Some (last (prefixes i x))" + +lemma psi_in_R2: "\ \ \\<^sup>2" +proof + define r_psi where "r_psi \ Cn 2 r_last [r_prefixes]" + have "recfn 2 r_psi" + unfolding r_psi_def by (simp add: r_prefixes_recfn) + then have "eval r_psi [i, n] \= last (prefixes i n)" for n i + unfolding r_psi_def using r_prefixes r_prefixes_recfn prefixes_neq_nil by simp + then have "(\i x. Some (last (prefixes i x))) \ \

\<^sup>2" + using `recfn 2 r_psi` P2I[of "r_psi"] by simp + with psi_def show "\ \ \

\<^sup>2" by presburger + moreover show "total2 psi" + unfolding psi_def by auto +qed + +lemma psi_0_or_1: + assumes "n > 0" + shows "\ i n \= 0 \ \ i n \= 1" +proof - + from assms obtain m where "n = Suc m" + using gr0_implies_Suc by blast + then have "last (prefixes i (Suc m)) = 0 \ last (prefixes i (Suc m)) = 1" + by simp + then show ?thesis using \n = Suc m\ psi_def by simp +qed + +text \The function @{term "prefixes"} does indeed provide the prefixes +for @{term "\"}.\ + +lemma psi_init: "(\ i) \ x = list_encode (prefixes i x)" +proof - + have "prefix (\ i) x = prefixes i x" + unfolding psi_def + by (induction x) (simp_all add: prefix_0 prefix_Suc) + with init_def show ?thesis by simp +qed + +text \One of the functions $\psi_i$ is in @{term "U\<^bsub>LIM-CONS\<^esub>"}.\ + +lemma ex_psi_in_U: "\j. \ j \ U\<^bsub>LIM-CONS\<^esub>" +proof - + obtain j where j: "j \ 2" "\ j = \ j" + using kleene_fixed_point[of \] psi_in_R2 R2_imp_P2 by metis + then have "\ j \ \

" by (simp add: phi_in_P2) + define p where "p = (\x. \ j (x + 1))" + have "p \ \\<^sub>0\<^sub>1" + proof - + from p_def `\ j \ \

` skip_P1 have "p \ \

" by blast + from psi_in_R2 have "total1 (\ j)" by simp + with p_def have "total1 p" + by (simp add: total1_def) + with psi_0_or_1 have "p n \= 0 \ p n \= 1" for n + using psi_def p_def by simp + then show ?thesis + by (simp add: RPred1_def P1_total_imp_R1 \p \ \

\ \total1 p\) + qed + moreover have "\ j = [j] \ p" + proof + fix x + show "\ j x = ([j] \ p) x" + proof (cases "x = 0") + case True + then show ?thesis using psi_def psi_def prepend_at_less by simp + next + case False + then show ?thesis using p_def by simp + qed + qed + ultimately have "\ j \ U\<^bsub>LIM-CONS\<^esub>" + using j U_LIMCONS_def by (metis (mono_tags, lifting) append_Nil mem_Collect_eq) + then show ?thesis by auto +qed + +text \The strategy fails to learn @{term U_LIMCONS} because it changes +its hypothesis all the time on functions $\psi_j \in V_0$.\ + +lemma U_LIMCONS_not_learn_cons: "\ learn_cons \ U\<^bsub>LIM-CONS\<^esub> s" +proof + assume learn: "learn_cons \ U\<^bsub>LIM-CONS\<^esub> s" + have "s (list_encode (vs @ [0])) \ s (list_encode (vs @ [1]))" for vs + proof - + obtain f\<^sub>0 where f0: "f\<^sub>0 \ U\<^bsub>LIM-CONS\<^esub>" "prefix f\<^sub>0 (length vs) = vs @ [0]" + using U_LIMCONS_prefix_complete[of "vs @ [0]"] by auto + obtain f\<^sub>1 where f1: "f\<^sub>1 \ U\<^bsub>LIM-CONS\<^esub>" "prefix f\<^sub>1 (length vs) = vs @ [1]" + using U_LIMCONS_prefix_complete[of "vs @ [1]"] by auto + have "f\<^sub>0 (length vs) \ f\<^sub>1 (length vs)" + using f0 f1 by (metis lessI nth_append_length prefix_nth zero_neq_one) + moreover have "\ (the (s (f\<^sub>0 \ length vs))) (length vs) = f\<^sub>0 (length vs)" + using learn_consE(3)[of \ U_LIMCONS s, OF learn, of f\<^sub>0 "length vs", OF f0(1)] + by simp + moreover have "\ (the (s (f\<^sub>1 \ length vs))) (length vs) = f\<^sub>1 (length vs)" + using learn_consE(3)[of \ U_LIMCONS s, OF learn, of f\<^sub>1 "length vs", OF f1(1)] + by simp + ultimately have "the (s (f\<^sub>0 \ length vs)) \ the (s (f\<^sub>1 \ length vs))" + by auto + then have "s (f\<^sub>0 \ length vs) \ s (f\<^sub>1 \ length vs)" + by auto + with f0(2) f1(2) show ?thesis by (simp add: init_def) + qed + then have "s (list_encode (vs @ [0])) \ s (list_encode vs) \ + s (list_encode (vs @ [1])) \ s (list_encode vs)" + for vs + by metis + then have "s (list_encode (prefixes i (Suc x))) \ s (list_encode (prefixes i x))" for i x + by simp + then have "\ learn_lim \ {\ i} s" for i + using psi_def psi_init always_hyp_change_not_Lim by simp + then have "\ learn_lim \ U_LIMCONS s" + using ex_psi_in_U learn_lim_closed_subseteq by blast + then show False + using learn learn_cons_def by simp +qed + +end + +text \With the locale we can now show the second part of the main +result:\ + +lemma U_LIMCONS_not_in_CONS: "U\<^bsub>LIM-CONS\<^esub> \ CONS" +proof + assume "U\<^bsub>LIM-CONS\<^esub> \ CONS" + then have "U\<^bsub>LIM-CONS\<^esub> \ CONS_wrt \" + by (simp add: CONS_wrt_phi_eq_CONS) + then obtain almost_s where "learn_cons \ U\<^bsub>LIM-CONS\<^esub> almost_s" + using CONS_wrt_def by auto + then obtain s where s: "total1 s" "learn_cons \ U\<^bsub>LIM-CONS\<^esub> s" + using U_LIMCONS_prefix_complete U_prefix_complete_imp_total_strategy by blast + then have "s \ \" + using learn_consE(1) P1_total_imp_R1 by blast + with cons_lim_def interpret cons_lim s by simp + show False + using s(2) U_LIMCONS_not_learn_cons by simp +qed + +text \The main result of this section:\ + +theorem CONS_subset_Lim: "CONS \ LIM" + using U_LIMCONS_in_Lim U_LIMCONS_not_in_CONS CONS_subseteq_Lim by auto + +end \ No newline at end of file diff --git a/thys/Inductive_Inference/CP_FIN_NUM.thy b/thys/Inductive_Inference/CP_FIN_NUM.thy new file mode 100644 --- /dev/null +++ b/thys/Inductive_Inference/CP_FIN_NUM.thy @@ -0,0 +1,1032 @@ +section \FIN is a proper subset of CP\label{s:fin_cp}\ + 
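+text \<open>Roughly speaking, the first lemma of this section turns a FIN strategy $S$
+for a non-empty class $U$ into a CP strategy $T$: fixing some $f_0 \in U$
+together with a $\psi$-index $i_0$ of $f_0$, the strategy $T$ constructed
+there is, in effect,
+\[
+T(f^n) = \left\{\begin{array}{ll}
+  i_0 & \mbox{if } S(f^n) = 0 \mbox{ (``don't know''),}\\
+  S(f^n) - 1 & \mbox{otherwise,}
+\end{array}\right.
+\]
+and it is undefined wherever $S$ is undefined.\<close>
+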
+theory CP_FIN_NUM + imports Inductive_Inference_Basics +begin + +text \Let $S$ be a FIN strategy for a non-empty class $U$. Let $T$ be a +strategy that hypothesizes an arbitrary function from $U$ while $S$ outputs +``don't know'' and the hypothesis of $S$ otherwise. Then $T$ is a CP strategy +for $U$.\ + +lemma nonempty_FIN_wrt_impl_CP: + assumes "U \ {}" and "U \ FIN_wrt \" + shows "U \ CP_wrt \" +proof - + obtain s where "learn_fin \ U s" + using assms(2) FIN_wrt_def by auto + then have env: "environment \ U s" and + fin: "\f. f \ U \ + \i n\<^sub>0. \ i = f \ (\n0. s (f \ n) \= 0) \ (\n\n\<^sub>0. s (f \ n) \= Suc i)" + using learn_finE by auto + from assms(1) obtain f\<^sub>0 where "f\<^sub>0 \ U" + by auto + with fin obtain i\<^sub>0 where "\ i\<^sub>0 = f\<^sub>0" + by blast + define t where "t x \ + (if s x \ then None else if s x \= 0 then Some i\<^sub>0 else Some (the (s x) - 1))" + for x + have "t \ \

" + proof - + from env obtain rs where rs: "recfn 1 rs" "\x. eval rs [x] = s x" + by auto + define rt where "rt = Cn 1 r_ifz [rs, r_const i\<^sub>0, Cn 1 r_dec [rs]]" + then have "recfn 1 rt" + using rs(1) by simp + then have "eval rt [x] \= (if s x \= 0 then i\<^sub>0 else (the (s x)) - 1)" if "s x \" for x + using rs rt_def that by auto + moreover have "eval rt [x] \" if "eval rs [x] \" for x + using rs rt_def that by simp + ultimately have "eval rt [x] = t x" for x + using rs(2) t_def by simp + with \recfn 1 rt\ show ?thesis by auto + qed + have "learn_cp \ U t" + proof (rule learn_cpI) + show "environment \ U t" + using env t_def \t \ \

\ by simp + show "\i. \ i = f \ (\\<^sup>\n. t (f \ n) \= i)" if "f \ U" for f + proof - + from that fin obtain i n\<^sub>0 where + i: "\ i = f" "\n0. s (f \ n) \= 0" "\n\n\<^sub>0. s (f \ n) \= Suc i" + by blast + moreover have "\n\n\<^sub>0. t (f \ n) \= i" + using that t_def i(3) by simp + ultimately show ?thesis by auto + qed + show "\ (the (t (f \ n))) \ U" if "f \ U" for f n + using \\ i\<^sub>0 = f\<^sub>0\ \f\<^sub>0 \ U\ t_def fin env that + by (metis (no_types, lifting) diff_Suc_1 not_less option.sel) + qed + then show ?thesis using CP_wrt_def env by auto +qed + +lemma FIN_wrt_impl_CP: + assumes "U \ FIN_wrt \" + shows "U \ CP_wrt \" +proof (cases "U = {}") + case True + then have "\ \ \

<P>\<^sup>2 \ U \<in> CP_wrt \<psi>"
+    using CP_wrt_def learn_cpI[of \<psi> "{}" "\<lambda>x. Some 0"] const_in_Prim1 by auto
+  moreover have "\<psi> \<in> \<P>
\<^sup>2" + using assms FIN_wrt_def learn_finE by auto + ultimately show "U \ CP_wrt \" by simp +next + case False + with nonempty_FIN_wrt_impl_CP assms show ?thesis + by simp +qed + +corollary FIN_subseteq_CP: "FIN \ CP" +proof + fix U + assume "U \ FIN" + then have "\\. U \ FIN_wrt \" + using FIN_def FIN_wrt_def by auto + then have "\\. U \ CP_wrt \" + using FIN_wrt_impl_CP by auto + then show "U \ CP" + by (simp add: CP_def CP_wrt_def) +qed + +text \In order to show the \emph{proper} inclusion, we show @{term +"U\<^sub>0 \ CP - FIN"}. A CP strategy for @{term "U\<^sub>0"} simply +hypothesizes the function in @{term U0} with the longest prefix of $f^n$ not +ending in zero. For that we define a function computing the index of the +rightmost non-zero value in a list, returning the length of the list if there +is no such value.\ + +definition findr :: partial1 where + "findr e \ + if \i 0 + then Some (GREATEST i. i < e_length e \ e_nth e i \ 0) + else Some (e_length e)" + +lemma findr_total: "findr e \" + unfolding findr_def by simp + +lemma findr_ex: + assumes "\i 0" + shows "the (findr e) < e_length e" + and "e_nth e (the (findr e)) \ 0" + and "\i. the (findr e) < i \ i < e_length e \ e_nth e i = 0" +proof - + let ?P = "\i. i < e_length e \ e_nth e i \ 0" + from assms have "\i. ?P i" by simp + then have "?P (Greatest ?P)" + using GreatestI_ex_nat[of ?P "e_length e"] by fastforce + moreover have *: "findr e = Some (Greatest ?P)" + using assms findr_def by simp + ultimately show "the (findr e) < e_length e" and "e_nth e (the (findr e)) \ 0" + by fastforce+ + show "\i. the (findr e) < i \ i < e_length e \ e_nth e i = 0" + using * Greatest_le_nat[of ?P _ "e_length e"] by fastforce +qed + +definition "r_findr \ + let g = + Cn 3 r_ifz + [Cn 3 r_nth [Id 3 2, Id 3 0], + Cn 3 r_ifeq [Id 3 0, Id 3 1, Cn 3 S [Id 3 0], Id 3 1], + Id 3 0] + in Cn 1 (Pr 1 Z g) [Cn 1 r_length [Id 1 0], Id 1 0]" + +lemma r_findr_prim [simp]: "prim_recfn 1 r_findr" + unfolding r_findr_def by simp + +lemma r_findr [simp]: "eval r_findr [e] = findr e" +proof - + define g where "g = + Cn 3 r_ifz + [Cn 3 r_nth [Id 3 2, Id 3 0], + Cn 3 r_ifeq [Id 3 0, Id 3 1, Cn 3 S [Id 3 0], Id 3 1], + Id 3 0]" + then have "recfn 3 g" + by simp + with g_def have g: "eval g [j, r, e] \= + (if e_nth e j \ 0 then j else if j = r then Suc j else r)" for j r e + by simp + let ?h = "Pr 1 Z g" + have "recfn 2 ?h" + by (simp add: \recfn 3 g\) + let ?P = "\e j i. i < j \ e_nth e i \ 0" + let ?G = "\e j. Greatest (?P e j)" + have h: "eval ?h [j, e] = + (if \irecfn 2 ?h\ by auto + next + case (Suc j) + then have "eval ?h [Suc j, e] = eval g [j, the (eval ?h [j, e]), e]" + using \recfn 2 ?h\ by auto + then have "eval ?h [Suc j, e] = + eval g [j, if \i= + (if e_nth e j \ 0 then j + else if j = (if \iiii 0" + by auto + show ?thesis + proof (cases "e_nth e j = 0") + case True + then have ex': "\i 0" + using ex less_Suc_eq by fastforce + then have "(if \i= ?G e j" + using * True by simp + moreover have "?G e j = ?G e (Suc j)" + using True by (metis less_SucI less_Suc_eq) + ultimately show ?thesis using ex by metis + next + case False + then have "eval ?h [Suc j, e] \= j" + using * by simp + moreover have "?G e (Suc j) = j" + using ex False Greatest_equality[of "?P e (Suc j)"] by simp + ultimately show ?thesis using ex by simp + qed + qed + qed + let ?hh = "Cn 1 ?h [Cn 1 r_length [Id 1 0], Id 1 0]" + have "recfn 1 ?hh" + using `recfn 2 ?h` by simp + with h have hh: "eval ?hh [e] \= + (if \i0 \ CP" +proof - + define s where + "s \ \x. 
if findr x \<down>= e_length x then Some 0 else Some (e_take (Suc (the (findr x))) x)"
+  have "s \<in> \<P>"
+  proof -
+    define r where
+      "r \ Cn 1 r_ifeq [r_findr, r_length, Z, Cn 1 r_take [Cn 1 S [r_findr], Id 1 0]]"
+    then have "\x. eval r [x] = s x"
+      using s_def findr_total by fastforce
+    moreover have "recfn 1 r"
+      using r_def by simp
+    ultimately show ?thesis by auto
+  qed
+  moreover have "learn_cp prenum U\<^sub>0 s"
+  proof (rule learn_cpI)
+    show "environment prenum U\<^sub>0 s"
+      using \<open>s \<in> \<P>
\ s_def prenum_in_R2 U0_in_NUM by auto + show "\i. prenum i = f \ (\\<^sup>\n. s (f \ n) \= i)" if "f \ U\<^sub>0" for f + proof (cases "f = (\_. Some 0)") + case True + then have "s (f \ n) \= 0" for n + using findr_def s_def by simp + then have "\n\0. s (f \ n) \= 0" by simp + moreover have "prenum 0 = f" + using True by auto + ultimately show ?thesis by auto + next + case False + then obtain ws where ws: "length ws > 0" "last ws \ 0" "f = ws \ 0\<^sup>\" + using U0_def \f \ U\<^sub>0\ almost0_canonical by blast + let ?m = "length ws - 1" + let ?i = "list_encode ws" + have "prenum ?i = f" + using ws by auto + moreover have "s (f \ n) \= ?i" if "n \ ?m" for n + proof - + have "e_nth (f \ n) ?m \ 0" + using ws that by (simp add: last_conv_nth) + then have "\k n) k \ 0" + using le_imp_less_Suc that by blast + moreover have + "(GREATEST k. k < e_length (f \ n) \ e_nth (f \ n) k \ 0) = ?m" + proof (rule Greatest_equality) + show "?m < e_length (f \ n) \ e_nth (f \ n) ?m \ 0" + using \e_nth (f \ n) ?m \ 0\ that by auto + show "\y. y < e_length (f \ n) \ e_nth (f \ n) y \ 0 \ y \ ?m" + using ws less_Suc_eq_le by fastforce + qed + ultimately have "findr (f \ n) \= ?m" + using that findr_def by simp + moreover have "?m < e_length (f \ n)" + using that by simp + ultimately have "s (f \ n) \= e_take (Suc ?m) (f \ n)" + using s_def by simp + moreover have "e_take (Suc ?m) (f \ n) = list_encode ws" + proof - + have "take (Suc ?m) (prefix f n) = prefix f ?m" + using take_prefix[of f ?m n] ws that by (simp add: almost0_in_R1) + then have "take (Suc ?m) (prefix f n) = ws" + using ws prefixI by auto + then show ?thesis by simp + qed + ultimately show ?thesis by simp + qed + ultimately show ?thesis by auto + qed + show "\f n. f \ U\<^sub>0 \ prenum (the (s (f \ n))) \ U\<^sub>0" + using U0_def by fastforce + qed + ultimately show ?thesis using CP_def by blast +qed + +text \As a bit of an interlude, we can now show that CP is not +closed under the subset relation. This works by removing functions from +@{term "U\<^sub>0"} in a ``noncomputable'' way such that a strategy cannot ensure +that every intermediate hypothesis is in that new class.\ + +lemma CP_not_closed_subseteq: "\V U. V \ U \ U \ CP \ V \ CP" +proof - + \ \The numbering $g\in\mathcal{R}^2$ enumerates all + functions $i0^\infty \in U_0$.\ + define g where "g \ \i. [i] \ 0\<^sup>\" + have g_inj: "i = j" if "g i = g j" for i j + proof - + have "g i 0 \= i" and "g j 0 \= j" + by (simp_all add: g_def) + with that show "i = j" + by (metis option.inject) + qed + + \ \Define a class $V$. If the strategy $\varphi_i$ learns + $g_i$, it outputs a hypothesis for $g_i$ on some shortest prefix $g_i^m$. + Then the function $g_i^m10^\infty$ is included in the class $V$; otherwise + $g_i$ is included.\ + define V where "V \ + {if learn_lim \ {g i} (\ i) + then (prefix (g i) (LEAST n. \ (the (\ i ((g i) \ n))) = g i)) @ [1] \ 0\<^sup>\ + else g i | + i. i \ UNIV}" + have "V \ CP_wrt \" + proof + \ \Assuming $V \in CP_\varphi$, there is a CP strategy + $\varphi_i$ for $V$.\ + assume "V \ CP_wrt \" + then obtain s where s: "s \ \

" "learn_cp \ V s" + using CP_wrt_def learn_cpE(1) by auto + then obtain i where i: "\ i = s" + using phi_universal by auto + + show False + proof (cases "learn_lim \ {g i} (\ i)") + case learn: True + \ \If $\varphi_i$ learns $g_i$, it hypothesizes $g_i$ on + some shortest prefix $g_i^m$. Thus it hypothesizes $g_i$ on some prefix + of $g_i^m10^\infty \in V$, too. But $g_i$ is not a class-preserving + hypothesis because $g_i \notin V$.\ + let ?P = "\n. \ (the (\ i ((g i) \ n))) = g i" + let ?m = "Least ?P" + have "\n. ?P n" + using i s by (meson learn infinite_hyp_wrong_not_Lim insertI1 lessI) + then have "?P ?m" + using LeastI_ex[of ?P] by simp + define h where "h = (prefix (g i) ?m) @ [1] \ 0\<^sup>\" + then have "h \ V" + using V_def learn by auto + have "(g i) \ ?m = h \ ?m" + proof - + have "prefix (g i) ?m = prefix h ?m" + unfolding h_def by (simp add: prefix_prepend_less) + then show ?thesis by auto + qed + then have "\ (the (\ i (h \ ?m))) = g i" + using `?P ?m` by simp + moreover have "g i \ V" + proof + assume "g i \ V" + then obtain j where j: "g i = + (if learn_lim \ {g j} (\ j) + then (prefix (g j) (LEAST n. \ (the (\ j ((g j) \ n))) = g j)) @ [1] \ 0\<^sup>\ + else g j)" + using V_def by auto + show False + proof (cases "learn_lim \ {g j} (\ j)") + case True + then have "g i = + (prefix (g j) (LEAST n. \ (the (\ j ((g j) \ n))) = g j)) @ [1] \ 0\<^sup>\" + (is "g i = ?vs @ [1] \ 0\<^sup>\") + using j by simp + moreover have len: "length ?vs > 0" by simp + ultimately have "g i (length ?vs) \= 1" + by (simp add: prepend_associative) + moreover have "g i (length ?vs) \= 0" + using g_def len by simp + ultimately show ?thesis by simp + next + case False + then show ?thesis + using j g_inj learn by auto + qed + qed + ultimately have "\ (the (\ i (h \ ?m))) \ V" by simp + then have "\ learn_cp \ V (\ i)" + using `h \ V` learn_cpE(3) by auto + then show ?thesis by (simp add: i s(2)) + next + \ \If $\varphi_i$ does not learn $g_i$, then $g_i\in V$. + Hence $\varphi_i$ does not learn $V$.\ + case False + then have "g i \ V" + using V_def by auto + with False have "\ learn_lim \ V (\ i)" + using learn_lim_closed_subseteq by auto + then show ?thesis + using s(2) i by (simp add: learn_cp_def) + qed + qed + then have "V \ CP" + using CP_wrt_phi by simp + moreover have "V \ U\<^sub>0" + using V_def g_def U0_def by auto + ultimately show ?thesis using U0_in_CP by auto +qed + +text \Continuing with the main result of this section, we show that +@{term "U\<^sub>0"} cannot be learned finitely. Any FIN strategy would have +to output a hypothesis for the constant zero function on some prefix. But +@{term "U\<^sub>0"} contains infinitely many other functions starting with +the same prefix, which the strategy then would not learn finitely.\ + +lemma U0_not_in_FIN: "U\<^sub>0 \ FIN" +proof + assume "U\<^sub>0 \ FIN" + then obtain \ s where "learn_fin \ U\<^sub>0 s" + using FIN_def by blast + with learn_finE have cp: "\f. f \ U\<^sub>0 \ + \i n\<^sub>0. \ i = f \ (\n0. s (f \ n) \= 0) \ (\n\n\<^sub>0. s (f \ n) \= Suc i)" + by simp_all + + define z where "z = [] \ 0\<^sup>\" + then have "z \ U\<^sub>0" + using U0_def by auto + with cp obtain i n\<^sub>0 where i: "\ i = z" and n0: "\n\n\<^sub>0. 
s (z \ n) \= Suc i" + by blast + + define w where "w = replicate (Suc n\<^sub>0) 0 @ [1] \ 0\<^sup>\" + then have "prefix w n\<^sub>0 = replicate (Suc n\<^sub>0) 0" + by (simp add: prefix_prepend_less) + moreover have "prefix z n\<^sub>0 = replicate (Suc n\<^sub>0) 0" + using prefixI[of "replicate (Suc n\<^sub>0) 0" z] less_Suc_eq_0_disj unfolding z_def + by fastforce + ultimately have "z \ n\<^sub>0 = w \ n\<^sub>0" + by (simp add: init_prefixE) + with n0 have *: "s (w \ n\<^sub>0) \= Suc i" by auto + + have "w \ U\<^sub>0" using w_def U0_def by auto + with cp obtain i' n\<^sub>0' where i': "\ i' = w" + and n0': "\n0'. s (w \ n) \= 0" "\n\n\<^sub>0'. s (w \ n) \= Suc i'" + by blast + + have "i \ i'" + proof + assume "i = i'" + then have "w = z" + using i i' by simp + have "w (Suc n\<^sub>0) \= 1" + using w_def prepend[of "replicate (Suc n\<^sub>0) 0 @ [1]" "0\<^sup>\" "Suc n\<^sub>0"] + by (metis length_append_singleton length_replicate lessI nth_append_length) + moreover have "z (Suc n\<^sub>0) \= 0" + using z_def by simp + ultimately show False + using \w = z\ by simp + qed + then have "s (w \ n\<^sub>0) \\ Suc i" + using n0' by (cases "n\<^sub>0 < n\<^sub>0'") simp_all + with * show False by simp +qed + +theorem FIN_subset_CP: "FIN \ CP" + using U0_in_CP U0_not_in_FIN FIN_subseteq_CP by auto + + +section \NUM and FIN are incomparable\label{s:num_fin}\ + +text \The class $V_0$ of all total recursive functions $f$ where $f(0)$ +is a Gödel number of $f$ can be learned finitely by always hypothesizing +$f(0)$. The class is not in NUM and therefore serves to separate NUM and +FIN.\ + +definition V0 :: "partial1 set" ("V\<^sub>0") where + "V\<^sub>0 = {f. f \ \ \ \ (the (f 0)) = f}" + +lemma V0_altdef: "V\<^sub>0 = {[i] \ f| i f. f \ \ \ \ i = [i] \ f}" + (is "V\<^sub>0 = ?W") +proof + show "V\<^sub>0 \ ?W" + proof + fix f + assume "f \ V\<^sub>0" + then have "f \ \" + unfolding V0_def by simp + then obtain i where i: "f 0 \= i" by fastforce + define g where "g = (\x. f (x + 1))" + then have "g \ \" + using skip_R1[OF `f \ \`] by blast + moreover have "[i] \ g = f" + using g_def i by auto + moreover have "\ i = f" + using `f \ V\<^sub>0` V0_def i by force + ultimately show "f \ ?W" by auto + qed + show "?W \ V\<^sub>0" + proof + fix g + assume "g \ ?W" + then have "\ (the (g 0)) = g" by auto + moreover have "g \ \" + using prepend_in_R1 `g \ ?W` by auto + ultimately show "g \ V\<^sub>0" + by (simp add: V0_def) + qed +qed + +lemma V0_in_FIN: "V\<^sub>0 \ FIN" +proof - + define s where "s = (\x. Some (Suc (e_hd x)))" + have "s \ \

" + proof - + define r where "r = Cn 1 S [r_hd]" + then have "recfn 1 r" by simp + moreover have "eval r [x] \= Suc (e_hd x)" for x + unfolding r_def by simp + ultimately show ?thesis + using s_def by blast + qed + have s: "s (f \ n) \= Suc (the (f 0))" for f n + unfolding s_def by simp + have "learn_fin \ V\<^sub>0 s" + proof (rule learn_finI) + show "environment \ V\<^sub>0 s" + using s_def \s \ \

\ phi_in_P2 V0_def by auto + show "\i n\<^sub>0. \ i = f \ (\n0. s (f \ n) \= 0) \ (\n\n\<^sub>0. s (f \ n) \= Suc i)" + if "f \ V\<^sub>0" for f + using that V0_def s by auto + qed + then show ?thesis using FIN_def by auto +qed + +text \To every @{term "f \ \"} a number can be prepended that is +a Gödel number of the resulting function. Such a function is then in $V_0$. + +If $V_0$ was in NUM, it would be embedded in a total numbering. Shifting this +numbering to the left, essentially discarding the values at point $0$, would +yield a total numbering for @{term "\"}, which contradicts @{thm[source] +R1_not_in_NUM}. This proves @{prop "V\<^sub>0 \ NUM"}.\ + +lemma prepend_goedel: + assumes "f \ \" + shows "\i. \ i = [i] \ f" +proof - + obtain r where r: "recfn 1 r" "total r" "\x. eval r [x] = f x" + using assms by auto + define r_psi where "r_psi = Cn 2 r_ifz [Id 2 1, Id 2 0, Cn 2 r [Cn 2 r_dec [Id 2 1]]]" + then have "recfn 2 r_psi" + using r(1) by simp + have "eval r_psi [i, x] = (if x = 0 then Some i else f (x - 1))" for i x + proof - + have "eval (Cn 2 r [Cn 2 r_dec [Id 2 1]]) [i, x] = f (x - 1)" + using r by simp + then have "eval r_psi [i, x] = eval r_ifz [x, i, the (f (x - 1))]" + unfolding r_psi_def using \recfn 2 r_psi\ r R1_imp_total1[OF assms] by auto + then show ?thesis + using assms by simp + qed + with \recfn 2 r_psi\ have "(\i x. if x = 0 then Some i else f (x - 1)) \ \

\<^sup>2" + by auto + with kleene_fixed_point obtain i where + "\ i = (\x. if x = 0 then Some i else f (x - 1))" + by blast + then have "\ i = [i] \ f" by auto + then show ?thesis by auto +qed + +lemma V0_in_FIN_minus_NUM: "V\<^sub>0 \ FIN - NUM" +proof - + have "V\<^sub>0 \ NUM" + proof + assume "V\<^sub>0 \ NUM" + then obtain \ where \: "\ \ \\<^sup>2" "\f. f \ V\<^sub>0 \ \i. \ i = f" + by auto + define \' where "\' i x = \ i (Suc x)" for i x + have "\' \ \\<^sup>2" + proof + from \(1) obtain r_psi where + r_psi: "recfn 2 r_psi" "total r_psi" "\i x. eval r_psi [i, x] = \ i x" + by blast + define r_psi' where "r_psi' = Cn 2 r_psi [Id 2 0, Cn 2 S [Id 2 1]]" + then have "recfn 2 r_psi'" and "\i x. eval r_psi' [i, x] = \' i x" + unfolding r_psi'_def \'_def using r_psi by simp_all + then show "\' \ \

\<^sup>2" by blast + show "total2 \'" + using \'_def \(1) by (simp add: total2I) + qed + have "\i. \' i = f" if "f \ \" for f + proof - + from that obtain j where j: "\ j = [j] \ f" + using prepend_goedel by auto + then have "\ j \ V\<^sub>0" + using that V0_altdef by auto + with \ obtain i where "\ i = \ j" by auto + then have "\' i = f" + using \'_def j by (auto simp add: prepend_at_ge) + then show ?thesis by auto + qed + with \\' \ \\<^sup>2\ have "\ \ NUM" by auto + with R1_not_in_NUM show False by simp + qed + then show ?thesis + using V0_in_FIN by auto +qed + +corollary FIN_not_subseteq_NUM: "\ FIN \ NUM" + using V0_in_FIN_minus_NUM by auto + + +section \NUM and CP are incomparable\label{s:num_cp}\ + +text \There are FIN classes outside of NUM, and CP encompasses FIN. +Hence there are CP classes outside of NUM, too.\ + +theorem CP_not_subseteq_NUM: "\ CP \ NUM" + using FIN_subseteq_CP FIN_not_subseteq_NUM by blast + +text \Conversely there is a subclass of @{term "U\<^sub>0"} that +is in NUM but cannot be learned in a class-preserving way. The following +proof is due to Jantke and Beick~\cite{jb-cpnii-81}. The idea is to +diagonalize against all strategies, that is, all partial recursive +functions.\ + +theorem NUM_not_subseteq_CP: "\ NUM \ CP" +proof- + \ \Define a family of functions $f_k$.\ + define f where "f \ \k. [k] \ 0\<^sup>\" + then have "f k \ \" for k + using almost0_in_R1 by auto + + \ \If the strategy $\varphi_k$ learns $f_k$ it hypothesizes + $f_k$ for some shortest prefix $f_k^{a_k}$. Define functions $f'_k = + k0^{a_k}10^\infty$.\ + define a where + "a \ \k. LEAST x. (\ (the ((\ k) ((f k) \ x)))) = f k" + define f' where "f' \ \k. (k # (replicate (a k) 0) @ [1]) \ 0\<^sup>\" + then have "f' k \ \" for k + using almost0_in_R1 by auto + + \ \Although $f_k$ and $f'_k$ differ, they share the prefix of length $a_k + 1$.\ + have init_eq: "(f' k) \ (a k) = (f k) \ (a k)" for k + proof (rule init_eqI) + fix x assume "x \ a k" + then show "f' k x = f k x" + by (cases "x = 0") (simp_all add: nth_append f'_def f_def) + qed + have "f k \ f' k" for k + proof - + have "f k (Suc (a k)) \= 0" using f_def by auto + moreover have "f' k (Suc (a k)) \= 1" + using f'_def prepend[of "(k # (replicate (a k) 0) @ [1])" "0\<^sup>\" "Suc (a k)"] + by (metis length_Cons length_append_singleton length_replicate lessI nth_Cons_Suc + nth_append_length) + ultimately show ?thesis by auto + qed + + \ \The separating class $U$ contains $f'_k$ if $\varphi_k$ + learns $f_k$; otherwise it contains $f_k$.\ + define U where + "U \ {if learn_lim \ {f k} (\ k) then f' k else f k |k. k \ UNIV}" + have "U \ CP" + proof + assume "U \ CP" + have "\k. learn_cp \ U (\ k)" + proof - + have "\\ s. learn_cp \ U s" + using CP_def `U \ CP` by auto + then obtain s where s: "learn_cp \ U s" + using learn_cp_wrt_goedel[OF goedel_numbering_phi] by blast + then obtain k where "\ k = s" + using phi_universal learn_cp_def learn_lim_def by auto + then show ?thesis using s by auto + qed + then obtain k where k: "learn_cp \ U (\ k)" by auto + then have learn: "learn_lim \ U (\ k)" + using learn_cp_def by simp + \ \If $f_k$ was in $U$, $\varphi_k$ would learn it. But then, + by definition of $U$, $f_k$ would not be in $U$. 
Hence $f_k \notin U$.\ + have "f k \ U" + proof + assume "f k \ U" + then obtain m where m: "f k = (if learn_lim \ {f m} (\ m) then f' m else f m)" + using U_def by auto + have "f k 0 \= m" + using f_def f'_def m by simp + moreover have "f k 0 \= k" by (simp add: f_def) + ultimately have "m = k" by simp + with m have "f k = (if learn_lim \ {f k} (\ k) then f' k else f k)" + by auto + moreover have "learn_lim \ {f k} (\ k)" + using \f k \ U\ learn_lim_closed_subseteq[OF learn] by simp + ultimately have "f k = f' k" + by simp + then show False + using \f k \ f' k\ by simp + qed + then have "f' k \ U" using U_def by fastforce + then have in_U: "\n. \ (the ((\ k) ((f' k) \ n))) \ U" + using learn_cpE(3)[OF k] by simp + + \ \Since $f'_k \in U$, the strategy $\varphi_k$ learns $f_k$. + Then $a_k$ is well-defined, $f'^{a_k} = f^{a_k}$, and $\varphi_k$ + hypothesizes $f_k$ on $f'^{a_k}$, which is not a class-preserving + hypothesis.\ + have "learn_lim \ {f k} (\ k)" using U_def \f k \ U\ by fastforce + then have "\i n\<^sub>0. \ i = f k \ (\n\n\<^sub>0. \ k ((f k) \ n) \= i)" + using learn_limE(2) by simp + then obtain i n\<^sub>0 where "\ i = f k \ (\n\n\<^sub>0. \ k ((f k) \ n) \= i)" + by auto + then have "\ (the (\ k ((f k) \ (a k)))) = f k" + using a_def LeastI[of "\x. (\ (the ((\ k) ((f k) \ x)))) = f k" n\<^sub>0] + by simp + then have "\ (the ((\ k) ((f' k) \ (a k)))) = f k" + using init_eq by simp + then show False + using \f k \ U\ in_U by metis + qed + moreover have "U \ NUM" + using NUM_closed_subseteq[OF U0_in_NUM, of U] f_def f'_def U0_def U_def + by fastforce + ultimately show ?thesis by auto +qed + + +section \NUM is a proper subset of TOTAL\label{s:num_total}\ + +text \A NUM class $U$ is embedded in a total numbering @{term \}. +The strategy $S$ with $S(f^n) = \min \{i \mid \forall k \le n: \psi_i(k) = +f(k)\}$ for $f \in U$ converges to the least index of $f$ in @{term \}, +and thus learns $f$ in the limit. Moreover it will be a TOTAL strategy +because @{term \} contains only total functions. This shows @{prop "NUM +\ TOTAL"}.\ + +text \First we define, for every hypothesis space $\psi$, a +function that tries to determine for a given list $e$ and index $i$ whether +$e$ is a prefix of $\psi_i$. In other words it tries to decide whether $i$ is +a consistent hypothesis for $e$. ``Tries'' refers to the fact that the +function will diverge if $\psi_i(x)\uparrow$ for any $x \le |e|$. 
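+In effect, the decision function we are after (written $\mathrm{cons}_\psi$ just
+for this sketch; it is the function \emph{consistent} introduced further below)
+behaves as follows, where $|e|$ denotes the length of the list $e$:
+\[
+\mathrm{cons}_\psi(i, e) = \left\{\begin{array}{ll}
+  0 & \mbox{if } \psi_i(k)\downarrow = e_k \mbox{ for all } k < |e|,\\
+  1 & \mbox{if } \psi_i(k)\downarrow \mbox{ for all } k < |e| \mbox{, but } \psi_i(k) \neq e_k \mbox{ for some } k,\\
+  \uparrow & \mbox{otherwise.}
+\end{array}\right.
+\]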
We start +with a version that checks the list only up to a given length.\ + +definition r_consist_upto :: "recf \ recf" where + "r_consist_upto r_psi \ + let g = Cn 4 r_ifeq + [Cn 4 r_psi [Id 4 2, Id 4 0], Cn 4 r_nth [Id 4 3, Id 4 0], Id 4 1, r_constn 3 1] + in Pr 2 (r_constn 1 0) g" + +lemma r_consist_upto_recfn: "recfn 2 r_psi \ recfn 3 (r_consist_upto r_psi)" + using r_consist_upto_def by simp + +lemma r_consist_upto: + assumes "recfn 2 r_psi" + shows "\k \ + eval (r_consist_upto r_psi) [j, i, e] = + (if \k= e_nth e k then Some 0 else Some 1)" + and "\ (\k) \ eval (r_consist_upto r_psi) [j, i, e] \" +proof - + define g where "g = + Cn 4 r_ifeq + [Cn 4 r_psi [Id 4 2, Id 4 0], Cn 4 r_nth [Id 4 3, Id 4 0], Id 4 1, r_constn 3 1]" + then have "recfn 4 g" + using assms by simp + moreover have "eval (Cn 4 r_nth [Id 4 3, Id 4 0]) [j, r, i, e] \= e_nth e j" for j r i e + by simp + moreover have "eval (r_constn 3 1) [j, r, i, e] \= 1" for j r i e + by simp + moreover have "eval (Cn 4 r_psi [Id 4 2, Id 4 0]) [j, r, i, e] = eval r_psi [i, j]" for j r i e + using assms(1) by simp + ultimately have g: "eval g [j, r, i, e] = + (if eval r_psi [i, j] \ then None + else if eval r_psi [i, j] \= e_nth e j then Some r else Some 1)" + for j r i e + using `recfn 4 g` g_def assms by auto + have goal1: "\k \ + eval (r_consist_upto r_psi) [j, i, e] = + (if \k= e_nth e k then Some 0 else Some 1)" + for j i e + proof (induction j) + case 0 + then show ?case + using r_consist_upto_def r_consist_upto_recfn assms eval_Pr_0 by simp + next + case (Suc j) + then have "eval (r_consist_upto r_psi) [Suc j, i, e] = + eval g [j, the (eval (r_consist_upto r_psi) [j, i, e]), i, e]" + using assms eval_Pr_converg_Suc g_def r_consist_upto_def r_consist_upto_recfn + by simp + also have "... = eval g [j, if \k= e_nth e k then 0 else 1, i, e]" + using Suc by auto + also have "... \= (if eval r_psi [i, j] \= e_nth e j + then if \k= e_nth e k then 0 else 1 else 1)" + using g by (simp add: Suc.prems) + also have "... \= (if \k= e_nth e k then 0 else 1)" + by (simp add: less_Suc_eq) + finally show ?case by simp + qed + then show "\k \ + eval (r_consist_upto r_psi) [j, i, e] = + (if \k= e_nth e k then Some 0 else Some 1)" + by simp + show "\ (\k) \ eval (r_consist_upto r_psi) [j, i, e] \" + proof - + assume "\ (\k)" + then have "\k" by simp + let ?P = "\k. k < j \ eval r_psi [i, k] \" + define kmin where "kmin = Least ?P" + then have "?P kmin" + using LeastI_ex[of ?P] \\k\ by auto + from kmin_def have "\k. k < kmin \ \ ?P k" + using kmin_def not_less_Least[of _ ?P] by blast + then have "\k < kmin. 
eval r_psi [i, k] \" + using `?P kmin` by simp + then have "eval (r_consist_upto r_psi) [kmin, i, e] = + (if \k= e_nth e k then Some 0 else Some 1)" + using goal1 by simp + moreover have "eval r_psi [i, kmin] \" + using `?P kmin` by simp + ultimately have "eval (r_consist_upto r_psi) [Suc kmin, i, e] \" + using r_consist_upto_def g assms by simp + moreover have "j \ kmin" + using `?P kmin` by simp + ultimately show "eval (r_consist_upto r_psi) [j, i, e] \" + using r_consist_upto_def r_consist_upto_recfn `?P kmin` eval_Pr_converg_le assms + by (metis (full_types) Suc_leI length_Cons list.size(3) numeral_2_eq_2 numeral_3_eq_3) + qed +qed + +text \The next function provides the consistency decision functions we +need.\ + +definition consistent :: "partial2 \ partial2" where + "consistent \ i e \ + if \k i k \ + then if \k i k \= e_nth e k + then Some 0 else Some 1 + else None" + +text \Given $i$ and $e$, @{term "consistent \"} decides whether $e$ +is a prefix of $\psi_i$, provided $\psi_i$ is defined for the length of +$e$.\ + +definition r_consistent :: "recf \ recf" where + "r_consistent r_psi \ + Cn 2 (r_consist_upto r_psi) [Cn 2 r_length [Id 2 1], Id 2 0, Id 2 1]" + +lemma r_consistent_recfn [simp]: "recfn 2 r_psi \ recfn 2 (r_consistent r_psi)" + using r_consistent_def r_consist_upto_recfn by simp + +lemma r_consistent_converg: + assumes "recfn 2 r_psi" and "\k" + shows "eval (r_consistent r_psi) [i, e] \= + (if \k= e_nth e k then 0 else 1)" +proof - + have "eval (r_consistent r_psi) [i, e] = eval (r_consist_upto r_psi) [e_length e, i, e]" + using r_consistent_def r_consist_upto_recfn assms(1) by simp + then show ?thesis using assms r_consist_upto(1) by simp +qed + +lemma r_consistent_diverg: + assumes "recfn 2 r_psi" and "\k" + shows "eval (r_consistent r_psi) [i, e] \" + unfolding r_consistent_def + using r_consist_upto_recfn[OF assms(1)] r_consist_upto[OF assms(1)] assms(2) + by simp + +lemma r_consistent: + assumes "recfn 2 r_psi" and "\x y. eval r_psi [x, y] = \ x y" + shows "eval (r_consistent r_psi) [i, e] = consistent \ i e" +proof (cases "\k i k \") + case True + then have "\k" + using assms by simp + then show ?thesis + unfolding consistent_def using True by (simp add: assms r_consistent_converg) +next + case False + then have "consistent \ i e \" + unfolding consistent_def by auto + moreover have "eval (r_consistent r_psi) [i, e] \" + using r_consistent_diverg[OF assms(1)] assms False by simp + ultimately show ?thesis by simp +qed + +lemma consistent_in_P2: + assumes "\ \ \

\<^sup>2" + shows "consistent \ \ \

\<^sup>2" + using assms r_consistent P2E[OF assms(1)] P2I r_consistent_recfn by metis + +lemma consistent_for_R2: + assumes "\ \ \\<^sup>2" + shows "consistent \ i e = + (if \j i j \= e_nth e j then Some 0 else Some 1)" + using assms by (simp add: consistent_def) + +lemma consistent_init: + assumes "\ \ \\<^sup>2" and "f \ \" + shows "consistent \ i (f \ n) = (if \ i \ n = f \ n then Some 0 else Some 1)" + using consistent_def[of _ _ "init f n"] assms init_eq_iff_eq_upto by simp + +lemma consistent_in_R2: + assumes "\ \ \\<^sup>2" + shows "consistent \ \ \\<^sup>2" + using total2I consistent_in_P2 consistent_for_R2[OF assms] P2_total_imp_R2 R2_imp_P2 assms + by (metis option.simps(3)) + +text \For total hypothesis spaces the next function computes the +minimum hypothesis consistent with a given prefix. It diverges if no such +hypothesis exists.\ + +definition min_cons_hyp :: "partial2 \ partial1" where + "min_cons_hyp \ e \ + if \i. consistent \ i e \= 0 then Some (LEAST i. consistent \ i e \= 0) else None" + +lemma min_cons_hyp_in_P1: + assumes "\ \ \\<^sup>2" + shows "min_cons_hyp \ \ \

" +proof - + from assms consistent_in_R2 obtain rc where + rc: "recfn 2 rc" "total rc" "\i e. eval rc [i, e] = consistent \ i e" + using R2E[of "consistent \"] by metis + define r where "r = Mn 1 rc" + then have "recfn 1 r" + using rc(1) by simp + moreover from this have "eval r [e] = min_cons_hyp \ e" for e + using r_def eval_Mn'[of 1 rc "[e]"] rc min_cons_hyp_def assms + by (auto simp add: consistent_in_R2) + ultimately show ?thesis by auto +qed + +text \The function @{term "min_cons_hyp \"} is a strategy for +learning all NUM classes embedded in @{term \}. It is an example of an +``identification-by-enumeration'' strategy.\ + +lemma NUM_imp_learn_total: + assumes "\ \ \\<^sup>2" and "U \ NUM_wrt \" + shows "learn_total \ U (min_cons_hyp \)" +proof (rule learn_totalI) + have ex_psi_i_f: "\i. \ i = f" if "f \ U" for f + using assms that NUM_wrt_def by simp + moreover have consistent_eq_0: "consistent \ i ((\ i) \ n) \= 0" for i n + using assms by (simp add: consistent_init) + ultimately have "\f n. f \ U \ min_cons_hyp \ (f \ n) \" + using min_cons_hyp_def assms(1) by fastforce + then show env: "environment \ U (min_cons_hyp \)" + using assms NUM_wrt_def min_cons_hyp_in_P1 NUM_E(1) NUM_I by auto + + show "\f n. f \ U \ \ (the (min_cons_hyp \ (f \ n))) \ \" + using assms by (simp) + + show "\i. \ i = f \ (\\<^sup>\n. min_cons_hyp \ (f \ n) \= i)" if "f \ U" for f + proof - + from that env have "f \ \" by auto + + let ?P = "\i. \ i = f" + define imin where "imin \ Least ?P" + with ex_psi_i_f that have imin: "?P imin" "\j. ?P j \ j \ imin" + using LeastI_ex[of ?P] Least_le[of ?P] by simp_all + then have f_neq: "\ i \ f" if "i < imin" for i + using leD that by auto + + let ?Q = "\i n. \ i \ n \ f \ n" + define nu :: "nat \ nat" where "nu = (\i. SOME n. ?Q i n)" + have nu_neq: "\ i \ (nu i) \ f \ (nu i)" if "i < imin" for i + proof - + from assms have "\ i \ \" by simp + moreover from assms imin(1) have "f \ \" by auto + moreover have "f \ \ i" + using that f_neq by auto + ultimately have "\n. f \ n \ (\ i) \ n" + using neq_fun_neq_init by simp + then show "?Q i (nu i)" + unfolding nu_def using someI_ex[of "\n. ?Q i n"] by metis + qed + + have "\n\<^sub>0. \n\n\<^sub>0. min_cons_hyp \ (f \ n) \= imin" + proof (cases "imin = 0") + case True + then have "\n. min_cons_hyp \ (f \ n) \= imin" + using consistent_eq_0 assms(1) imin(1) min_cons_hyp_def by auto + then show ?thesis by simp + next + case False + define n\<^sub>0 where "n\<^sub>0 = Max (set (map nu [0.. n\<^sub>0" if "i < imin" for i + proof - + have "finite ?N" + using n\<^sub>0_def by simp + moreover have "?N \ {}" + using False n\<^sub>0_def by simp + moreover have "nu i \ ?N" + using that by simp + ultimately show ?thesis + using that Max_ge n\<^sub>0_def by blast + qed + then have "\ i \ n\<^sub>0 \ f \ n\<^sub>0" if "i < imin" for i + using nu_neq neq_init_forall_ge that by blast + then have *: "\ i \ n \ f \ n" if "i < imin" and "n \ n\<^sub>0" for i n + using nu_neq neq_init_forall_ge that by blast + + have "\ imin \ n = f \ n" for n + using imin(1) by simp + moreover have "(consistent \ i (f \ n) \= 0) = (\ i \ n = f \ n)" for i n + by (simp add: \f \ \\ assms(1) consistent_init) + ultimately have "min_cons_hyp \ (f \ n) \= (LEAST i. \ i \ n = f \ n)" for n + using min_cons_hyp_def[of \ "f \ n"] by auto + moreover have "(LEAST i. \ i \ n = f \ n) = imin" if "n \ n\<^sub>0" for n + proof (rule Least_equality) + show "\ imin \ n = f \ n" + using imin(1) by simp + show "\y. 
\ y \ n = f \ n \ imin \ y" + using imin * leI that by blast + qed + ultimately have "min_cons_hyp \ (f \ n) \= imin" if "n \ n\<^sub>0" for n + using that by blast + then show ?thesis by auto + qed + with imin(1) show ?thesis by auto + qed +qed + +corollary NUM_subseteq_TOTAL: "NUM \ TOTAL" +proof + fix U + assume "U \ NUM" + then have "\\\\\<^sup>2. \f\U. \i. \ i = f" by auto + then have "\\\\\<^sup>2. U \ NUM_wrt \" + using NUM_wrt_def by simp + then have "\\ s. learn_total \ U s" + using NUM_imp_learn_total by auto + then show "U \ TOTAL" + using TOTAL_def by auto +qed + +text \The class @{term V0} is in @{term "TOTAL - NUM"}. \ + +theorem NUM_subset_TOTAL: "NUM \ TOTAL" + using CP_subseteq_TOTAL FIN_not_subseteq_NUM FIN_subseteq_CP NUM_subseteq_TOTAL + by auto + +end \ No newline at end of file diff --git a/thys/Inductive_Inference/Inductive_Inference_Basics.thy b/thys/Inductive_Inference/Inductive_Inference_Basics.thy new file mode 100644 --- /dev/null +++ b/thys/Inductive_Inference/Inductive_Inference_Basics.thy @@ -0,0 +1,1222 @@ +chapter \Inductive inference of recursive functions\label{c:iirf}\ + +theory Inductive_Inference_Basics + imports Standard_Results +begin + +text \Inductive inference originates from work by +Solomonoff~\cite{s-ftiip1-64,s-ftiip2-64} and Gold~\cite{g-lil-67,g-lr-65} +and comes in many variations. The common theme is to infer additional +information about objects, such as formal languages or functions, from incomplete +data, such as finitely many words contained in the language or argument-value +pairs of the function. Oftentimes ``additional information'' means complete +information, such that the task becomes identification of the object. + +The basic setting in inductive inference of recursive functions is as follows. +Let us denote, for a total function $f$, by $f^n$ the code of the list +$[f(0), ..., f(n)]$. Let $U$ be a set (called \emph{class}) of total +recursive functions, and $\psi$ a binary partial recursive function +(called \emph{hypothesis space}). +A partial recursive function $S$ (called \emph{strategy}) +is said to \emph{learn $U$ in the limit with respect to $\psi$} if +for all $f \in U$, +\begin{itemize} + \item the value $S(f^n)$ is defined for all $n\in\mathbb{N}$, + \item the sequence $S(f^0), S(f^1), \ldots$ converges to an + $i\in\mathbb{N}$ with $\psi_i = f$. +\end{itemize} + +Both the output $S(f^n)$ of the strategy and its interpretation +as a function $\psi_{S(f^n)}$ are called \emph{hypothesis}. The set +of all classes learnable in the limit by $S$ with respect to $\psi$ is +denoted by $\mathrm{LIM}_\psi(S)$. Moreover we set $\mathrm{LIM}_\psi = +\bigcup_{S\in\mathcal{P}} \mathrm{LIM}_\psi(S)$ and $\mathrm{LIM} = +\bigcup_{\psi\in\mathcal{P}^2} \mathrm{LIM}_\psi$. We call the latter set the +\emph{inference type} $\mathrm{LIM}$. + +Many aspects of this setting can be varied. We shall consider: +\begin{itemize} + \item Intermediate hypotheses: $\psi_{S(f^n)}$ can be required to be total or + to be in the class $U$, or to coincide with $f$ on arguments up to $n$, or + a myriad of other conditions or combinations thereof. + \item Convergence of hypotheses: + \begin{itemize} + \item The strategy can be required to output not a sequence but a single + hypothesis, which must be correct. + \item The strategy can be required to converge to a \emph{function} rather + than an index. 
+ \end{itemize} +\end{itemize} + +We formalize five kinds of results (\\\ and \\'\ stand for +inference types): +\begin{itemize} + \item Comparison of learning power: results of the form @{prop "\ + \ \'"}, in particular showing that the inclusion is proper + (Sections~\ref{s:fin_cp}, \ref{s:num_fin}, \ref{s:num_cp}, + \ref{s:num_total}, \ref{s:cons_lim}, \ref{s:lim_bc}, \ref{s:total_cons}, + \ref{s:r1_bc}). + \item Whether \\\ is closed under the subset relation: @{prop "U + \ \ \ V \ U \ V \ \"}. + \item Whether \\\ is closed under union: @{prop "U \ \ \ + V \ \ \ U \ V \ \"} (Section~\ref{s:union}). + \item Whether every class in \\\ can be learned with respect to a + Gödel numbering as hypothesis space (Section~\ref{s:inference_types}). + \item Whether every class in \\\ can be learned by a \emph{total} + recursive strategy (Section~\ref{s:lemma_r}). +\end{itemize} + +The bulk of this chapter is devoted to the first category of results. Most +results that we are going to formalize have been called ``classical'' by +Jantke and Beick~\cite{jb-cpnii-81}, who compare a large number of inference +types. Another comparison is by Case and Smith~\cite{cs-cicmii-83}. Angluin +and Smith~\cite{as-ii-87} give an overview of various forms of inductive +inference. + +All (interesting) proofs herein are based on my lecture notes of the +\emph{Induktive Inferenz} lectures by Rolf Wiehagen from 1999/2000 and +2000/2001 at the University of Kaiserslautern. I have given references to the +original proofs whenever I was able to find them. For the other proofs, as +well as for those that I had to contort beyond recognition, I provide proof +sketches.\ + + +section \Preliminaries\ + +text \Throughout the chapter, in particular in proof sketches, we use +the following notation. + +Let $b\in\mathbb{N}^*$ be a list of numbers. We write $|b|$ for its length +and $b_i$ for the $i$-th element ($i=0,\dots, |b| - 1$). Concatenation of +numbers and lists works in the obvious way; for instance, $jbk$ with +$j,k\in\mathbb{N}$, $b\in\mathbb{N}^*$ refers to the list $jb_0\dots +b_{|b|-1}k$. For $0 \leq i < |b|$, the term $b_{i:=v}$ denotes the list +$b_0\dots b_{i-1}vb_{i+1}\dots b_{|b|-1}$. The notation $b_{ + + +subsection \The prefixes of a function\ + +text \A \emph{prefix}, also called \emph{initial segment}, is a list of +initial values of a function.\ + +definition prefix :: "partial1 \ nat \ nat list" where + "prefix f n \ map (\x. the (f x)) [0..x. the (f x)"] by simp + +lemma prefixI: + assumes "length vs > 0" and "\x. x < length vs \ f x \= vs ! x" + shows "prefix f (length vs - 1) = vs" + using assms nth_equalityI[of "prefix f (length vs - 1)" vs] by simp + +lemma prefixI': + assumes "length vs = Suc n" and "\x. x < Suc n \ f x \= vs ! x" + shows "prefix f n = vs" + using assms nth_equalityI[of "prefix f (length vs - 1)" vs] by simp + +lemma prefixE: + assumes "prefix f (length vs - 1) = vs" + and "f \ \" + and "length vs > 0" + and "x < length vs" + shows "f x \= vs ! x" + using assms length_prefix prefix_nth[of x "length vs - 1" f] by simp + +lemma prefix_eqI: + assumes "\x. 
x \ n \ f x = g x" + shows "prefix f n = prefix g n" + using assms prefix_def by simp + +lemma prefix_0: "prefix f 0 = [the (f 0)]" + using prefix_def by simp + +lemma prefix_Suc: "prefix f (Suc n) = prefix f n @ [the (f (Suc n))]" + unfolding prefix_def by simp + +lemma take_prefix: + assumes "f \ \" and "k \ n" + shows "prefix f k = take (Suc k) (prefix f n)" +proof - + let ?vs = "take (Suc k) (prefix f n)" + have "length ?vs = Suc k" + using assms(2) by simp + then have "\x. x < length ?vs \ f x \= ?vs ! x" + using assms by auto + then show ?thesis + using prefixI[where ?vs="?vs"] `length ?vs = Suc k` by simp +qed + +text \Strategies receive prefixes in the form of encoded lists. The +term ``prefix'' refers to both encoded and unencoded lists. We use the +notation @{text "f \ n"} for the prefix $f^n$.\ + +definition init :: "partial1 \ nat \ nat" (infix "\" 110) where + "f \ n \ list_encode (prefix f n)" + +lemma init_neq_zero: "f \ n \ 0" + unfolding init_def prefix_def using list_encode_0 by fastforce + +lemma init_prefixE [elim]: "prefix f n = prefix g n \ f \ n = g \ n" + unfolding init_def by simp + +lemma init_eqI: + assumes "\x. x \ n \ f x = g x" + shows "f \ n = g \ n" + unfolding init_def using prefix_eqI[OF assms] by simp + +lemma initI: + assumes "e_length e > 0" and "\x. x < e_length e \ f x \= e_nth e x" + shows "f \ (e_length e - 1) = e" + unfolding init_def using assms prefixI by simp + +lemma initI': + assumes "e_length e = Suc n" and "\x. x < Suc n \ f x \= e_nth e x" + shows "f \ n = e" + unfolding init_def using assms prefixI' by simp + +lemma init_iff_list_eq_upto: + assumes "f \ \" and "e_length vs > 0" + shows "(\x= e_nth vs x) \ prefix f (e_length vs - 1) = list_decode vs" + using prefixI[OF assms(2)] prefixE[OF _ assms] by auto + +lemma length_init [simp]: "e_length (f \ n) = Suc n" + unfolding init_def by simp + +lemma init_Suc_snoc: "f \ (Suc n) = e_snoc (f \ n) (the (f (Suc n)))" + unfolding init_def by (simp add: prefix_Suc) + +lemma nth_init: "i < Suc n \ e_nth (f \ n) i = the (f i)" + unfolding init_def using prefix_nth by auto + +lemma hd_init [simp]: "e_hd (f \ n) = the (f 0)" + unfolding init_def using init_neq_zero by (simp add: e_hd_nth0) + +lemma list_decode_init [simp]: "list_decode (f \ n) = prefix f n" + unfolding init_def by simp + +lemma init_eq_iff_eq_upto: + assumes "g \ \" and "f \ \" + shows "(\j g \ n = f \ n" + using assms initI' init_iff_list_eq_upto length_init list_decode_init + by (metis diff_Suc_1 zero_less_Suc) + +definition is_init_of :: "nat \ partial1 \ bool" where + "is_init_of t f \ \i= e_nth t i" + +lemma not_initial_imp_not_eq: + assumes "\x. x < Suc n \ f x \" and "\ (is_init_of (f \ n) g)" + shows "f \ g" + using is_init_of_def assms by auto + +lemma all_init_eq_imp_fun_eq: + assumes "f \ \" and "g \ \" and "\n. f \ n = g \ n" + shows "f = g" +proof + fix n + from assms have "prefix f n = prefix g n" + by (metis init_def list_decode_encode) + then have "the (f n) = the (g n)" + unfolding init_def prefix_def by simp + then show "f n = g n" + using assms(1,2) by (meson R1_imp_total1 option.expand total1E) +qed + +corollary neq_fun_neq_init: + assumes "f \ \" and "g \ \" and "f \ g" + shows "\n. 
f \ n \ g \ n" + using assms all_init_eq_imp_fun_eq by auto + +lemma eq_init_forall_le: + assumes "f \ n = g \ n" and "m \ n" + shows "f \ m = g \ m" +proof - + from assms(1) have "prefix f n = prefix g n" + by (metis init_def list_decode_encode) + then have "the (f k) = the (g k)" if "k \ n" for k + using prefix_def that by auto + then have "the (f k) = the (g k)" if "k \ m" for k + using assms(2) that by simp + then have "prefix f m = prefix g m" + using prefix_def by simp + then show ?thesis by (simp add: init_def) +qed + +corollary neq_init_forall_ge: + assumes "f \ n \ g \ n" and "m \ n" + shows "f \ m \ g \ m" + using eq_init_forall_le assms by blast + +lemma e_take_init: + assumes "f \ \" and "k < Suc n" + shows "e_take (Suc k) (f \ n) = f \ k" + using assms take_prefix by (simp add: init_def less_Suc_eq_le) + +lemma init_butlast_init: + assumes "total1 f" and "f \ n = e" and "n > 0" + shows "f \ (n - 1) = e_butlast e" +proof - + let ?e = "e_butlast e" + have "e_length e = Suc n" + using assms(2) by auto + then have len: "e_length ?e = n" + by simp + have "f \ (e_length ?e - 1) = ?e" + proof (rule initI) + show "0 < e_length ?e" + using assms(3) len by simp + have "\x. x < e_length e \ f x \= e_nth e x" + using assms(1,2) total1_def \e_length e = Suc n\ by auto + then show "\x. x < e_length ?e \ f x \= e_nth ?e x" + by (simp add: butlast_conv_take) + qed + with len show ?thesis by simp +qed + +text \Some definitions make use of recursive predicates, that is, +$01$-valued functions.\ + +definition RPred1 :: "partial1 set" ("\\<^sub>0\<^sub>1") where + "\\<^sub>0\<^sub>1 \ {f. f \ \ \ (\x. f x \= 0 \ f x \= 1)}" + +lemma RPred1_subseteq_R1: "\\<^sub>0\<^sub>1 \ \" + unfolding RPred1_def by auto + +lemma const0_in_RPred1: "(\_. Some 0) \ \\<^sub>0\<^sub>1" + using RPred1_def const_in_Prim1 by fast + +lemma RPred1_altdef: "\\<^sub>0\<^sub>1 = {f. f \ \ \ (\x. the (f x) \ 1)}" + (is "\\<^sub>0\<^sub>1 = ?S") +proof + show "\\<^sub>0\<^sub>1 \ ?S" + proof + fix f + assume f: "f \ \\<^sub>0\<^sub>1" + with RPred1_def have "f \ \" by auto + from f have "\x. f x \= 0 \ f x \= 1" + by (simp add: RPred1_def) + then have "\x. the (f x) \ 1" + by (metis eq_refl less_Suc_eq_le zero_less_Suc option.sel) + with `f \ \` show "f \ ?S" by simp + qed + show "?S \ \\<^sub>0\<^sub>1" + proof + fix f + assume f: "f \ ?S" + then have "f \ \" by simp + then have total: "\x. f x \" by auto + from f have "\x. the (f x) = 0 \ the (f x) = 1" + by (simp add: le_eq_less_or_eq) + with total have "\x. f x \= 0 \ f x \= 1" + by (metis option.collapse) + then show "f \ \\<^sub>0\<^sub>1" + using `f \ \` RPred1_def by auto + qed +qed + +subsection \NUM\ + +text \A class of recursive functions is in NUM if it can be +embedded in a total numbering. Thus, for learning such classes there is +always a total hypothesis space available.\ + +definition NUM :: "partial1 set set" where + "NUM \ {U. \\\\\<^sup>2. \f\U. \i. \ i = f}" + +definition NUM_wrt :: "partial2 \ partial1 set set" where + "\ \ \\<^sup>2 \ NUM_wrt \ \ {U. \f\U. \i. \ i = f}" + +lemma NUM_I [intro]: + assumes "\ \ \\<^sup>2" and "\f. f \ U \ \i. \ i = f" + shows "U \ NUM" + using assms NUM_def by blast + +lemma NUM_E [dest]: + assumes "U \ NUM" + shows "U \ \" + and "\\\\\<^sup>2. \f\U. \i. 
\ i = f" + using NUM_def assms by (force, auto) + +lemma NUM_closed_subseteq: + assumes "U \ NUM" and "V \ U" + shows "V \ NUM" + using assms subset_eq[of V U] NUM_I by auto + +text \This is the classical diagonalization proof showing that there is +no total numbering containing all total recursive functions.\ + +lemma R1_not_in_NUM: "\ \ NUM" +proof + assume "\ \ NUM" + then obtain \ where num: "\ \ \\<^sup>2" "\f\\. \i. \ i = f" + by auto + then obtain psi where psi: "recfn 2 psi" "total psi" "eval psi [i, x] = \ i x" for i x + by auto + define d where "d = Cn 1 S [Cn 1 psi [Id 1 0, Id 1 0]]" + then have "recfn 1 d" + using psi(1) by simp + moreover have d: "eval d [x] \= Suc (the (\ x x))" for x + unfolding d_def using num psi by simp + ultimately have "(\x. eval d [x]) \ \" + using R1I by blast + then obtain i where "\ i = (\x. eval d [x])" + using num(2) by auto + then have "\ i i = eval d [i]" by simp + with d have "\ i i \= Suc (the (\ i i))" by simp + then show False + using option.sel[of "Suc (the (\ i i))"] by simp +qed + +text \A hypothesis space that contains a function for every prefix will +come in handy. The following is a total numbering with this property.\ + +definition "r_prenum \ + Cn 2 r_ifless [Id 2 1, Cn 2 r_length [Id 2 0], Cn 2 r_nth [Id 2 0, Id 2 1], r_constn 1 0]" + +lemma r_prenum_prim [simp]: "prim_recfn 2 r_prenum" + unfolding r_prenum_def by simp_all + +lemma r_prenum [simp]: + "eval r_prenum [e, x] \= (if x < e_length e then e_nth e x else 0)" + by (simp add: r_prenum_def) + +definition prenum :: partial2 where + "prenum e x \ Some (if x < e_length e then e_nth e x else 0)" + +lemma prenum_in_R2: "prenum \ \\<^sup>2" + using prenum_def Prim2I[OF r_prenum_prim, of prenum] by simp + +lemma prenum [simp]: "prenum e x \= (if x < e_length e then e_nth e x else 0)" + unfolding prenum_def .. + +lemma prenum_encode: + "prenum (list_encode vs) x \= (if x < length vs then vs ! x else 0)" + using prenum_def by (cases "x < length vs") simp_all + +text \Prepending a list of numbers to a function:\ + +definition prepend :: "nat list \ partial1 \ partial1" (infixr "\" 64) where + "vs \ f \ \x. if x < length vs then Some (vs ! x) else f (x - length vs)" + +lemma prepend [simp]: + "(vs \ f) x = (if x < length vs then Some (vs ! x) else f (x - length vs))" + unfolding prepend_def .. + +lemma prepend_total: "total1 f \ total1 (vs \ f)" + unfolding total1_def by simp + +lemma prepend_at_less: + assumes "n < length vs" + shows "(vs \ f) n \= vs ! n" + using assms by simp + +lemma prepend_at_ge: + assumes "n \ length vs" + shows "(vs \ f) n = f (n - length vs)" + using assms by simp + +lemma prefix_prepend_less: + assumes "n < length vs" + shows "prefix (vs \ f) n = take (Suc n) vs" + using assms length_prefix by (intro nth_equalityI) simp_all + +lemma prepend_eqI: + assumes "\x. x < length vs \ g x \= vs ! x" + and "\x. 
g (length vs + x) = f x" + shows "g = vs \ f" +proof + fix x + show "g x = (vs \ f) x" + proof (cases "x < length vs") + case True + then show ?thesis using assms by simp + next + case False + then show ?thesis + using assms prepend by (metis add_diff_inverse_nat) + qed +qed + +fun r_prepend :: "nat list \ recf \ recf" where + "r_prepend [] r = r" +| "r_prepend (v # vs) r = + Cn 1 (r_lifz (r_const v) (Cn 1 (r_prepend vs r) [r_dec])) [Id 1 0, Id 1 0]" + +lemma r_prepend_recfn: + assumes "recfn 1 r" + shows "recfn 1 (r_prepend vs r)" + using assms by (induction vs) simp_all + +lemma r_prepend: + assumes "recfn 1 r" + shows "eval (r_prepend vs r) [x] = + (if x < length vs then Some (vs ! x) else eval r [x - length vs])" +proof (induction vs arbitrary: x) + case Nil + then show ?case using assms by simp +next + case (Cons v vs) + show ?case + using assms Cons by (cases "x = 0") (auto simp add: r_prepend_recfn) +qed + +lemma r_prepend_total: + assumes "recfn 1 r" and "total r" + shows "eval (r_prepend vs r) [x] \= + (if x < length vs then vs ! x else the (eval r [x - length vs]))" +proof (induction vs arbitrary: x) + case Nil + then show ?case using assms by simp +next + case (Cons v vs) + show ?case + using assms Cons by (cases "x = 0") (auto simp add: r_prepend_recfn) +qed + +lemma prepend_in_P1: + assumes "f \ \
" + shows "vs \ f \ \
" +proof - + obtain r where r: "recfn 1 r" "\x. eval r [x] = f x" + using assms by auto + moreover have "recfn 1 (r_prepend vs r)" + using r r_prepend_recfn by simp + moreover have "eval (r_prepend vs r) [x] = (vs \ f) x" for x + using r r_prepend by simp + ultimately show ?thesis by blast +qed + +lemma prepend_in_R1: + assumes "f \ \" + shows "vs \ f \ \" +proof - + obtain r where r: "recfn 1 r" "total r" "\x. eval r [x] = f x" + using assms by auto + then have "total1 f" + using R1_imp_total1[OF assms] by simp + have "total (r_prepend vs r)" + using r r_prepend_total r_prepend_recfn totalI1[of "r_prepend vs r"] by simp + with r have "total (r_prepend vs r)" by simp + moreover have "recfn 1 (r_prepend vs r)" + using r r_prepend_recfn by simp + moreover have "eval (r_prepend vs r) [x] = (vs \ f) x" for x + using r r_prepend `total1 f` total1E by simp + ultimately show ?thesis by auto +qed + +lemma prepend_associative: "(us @ vs) \ f = us \ vs \ f" (is "?lhs = ?rhs") +proof + fix x + consider + "x < length us" + | "x \ length us \ x < length (us @ vs)" + | "x \ length (us @ vs)" + by linarith + then show "?lhs x = ?rhs x" + proof (cases) + case 1 + then show ?thesis + by (metis le_add1 length_append less_le_trans nth_append prepend_at_less) + next + case 2 + then show ?thesis + by (smt add_diff_inverse_nat add_less_cancel_left length_append nth_append prepend) + next + case 3 + then show ?thesis + using prepend_at_ge by auto + qed +qed + +abbreviation constant_divergent :: partial1 ("\\<^sup>\") where + "\\<^sup>\ \ \_. None" + +abbreviation constant_zero :: partial1 ("0\<^sup>\") where + "0\<^sup>\ \ \_. Some 0" + +lemma almost0_in_R1: "vs \ 0\<^sup>\ \ \" + using RPred1_subseteq_R1 const0_in_RPred1 prepend_in_R1 by auto + +text \The class $U_0$ of all total recursive functions that are almost +everywhere zero will be used several times to construct +(counter-)examples.\ + +definition U0 :: "partial1 set" ("U\<^sub>0") where + "U\<^sub>0 \ {vs \ 0\<^sup>\ |vs. vs \ UNIV}" + +text \The class @{term U0} contains exactly the functions in the +numbering @{term prenum}.\ + +lemma U0_altdef: "U\<^sub>0 = {prenum e| e. e \ UNIV}" (is "U\<^sub>0 = ?W") +proof + show "U\<^sub>0 \ ?W" + proof + fix f + assume "f \ U\<^sub>0" + with U0_def obtain vs where "f = vs \ 0\<^sup>\" + by auto + then have "f = prenum (list_encode vs)" + using prenum_encode by auto + then show "f \ ?W" by auto + qed + show "?W \ U\<^sub>0" + unfolding U0_def by fastforce +qed + +lemma U0_in_NUM: "U\<^sub>0 \ NUM" + using prenum_in_R2 U0_altdef by (intro NUM_I[of prenum]; force) + +text \Every almost-zero function can be represented by $v0^\infty$ for +a list $v$ not ending in zero.\ + +lemma almost0_canonical: + assumes "f = vs \ 0\<^sup>\" and "f \ 0\<^sup>\" + obtains ws where "length ws > 0" and "last ws \ 0" and "f = ws \ 0\<^sup>\" +proof - + let ?P = "\k. k < length vs \ vs ! k \ 0" + from assms have "vs \ []" + by auto + then have ex: "\k 0" + using assms by auto + define m where "m = Greatest ?P" + moreover have le: "\y. 
?P y \ y \ length vs" + by simp + ultimately have "?P m" + using ex GreatestI_ex_nat[of ?P "length vs"] by simp + have not_gr: "\ ?P k" if "k > m" for k + using Greatest_le_nat[of ?P _ "length vs"] m_def ex le not_less that by blast + let ?ws = "take (Suc m) vs" + have "vs \ 0\<^sup>\ = ?ws \ 0\<^sup>\" + proof + fix x + show "(vs \ 0\<^sup>\) x = (?ws \ 0\<^sup>\) x" + proof (cases "x < Suc m") + case True + then show ?thesis using `?P m` by simp + next + case False + moreover from this have "(?ws \ 0\<^sup>\) x \= 0" + by simp + ultimately show ?thesis + using not_gr by (cases "x < length vs") simp_all + qed + qed + then have "f = ?ws \ 0\<^sup>\" + using assms(1) by simp + moreover have "length ?ws > 0" + by (simp add: \vs \ []\) + moreover have "last ?ws \ 0" + by (simp add: \?P m\ take_Suc_conv_app_nth) + ultimately show ?thesis using that by blast +qed + + +section \Types of inference\label{s:inference_types}\ + +text \This section introduces all inference types that we are going to +consider together with some of their simple properties. All these inference +types share the following condition, which essentially says that everything +must be computable:\ + +abbreviation environment :: "partial2 \ (partial1 set) \ partial1 \ bool" where + "environment \ U s \ \ \ \
\<^sup>2 \ U \ \ \ s \ \
\ (\f\U. \n. s (f \ n) \)" + + +subsection \LIM: Learning in the limit\ + +text \A strategy $S$ learns a class $U$ in the limit with respect to a +hypothesis space @{term "\ \ \
\<^sup>2"} if for all $f\in U$, the +sequence $(S(f^n))_{n\in\mathbb{N}}$ converges to an $i$ with $\psi_i = f$. +Convergence for a sequence of natural numbers means that almost all elements +are the same. We express this with the following notation.\ + +abbreviation Almost_All :: "(nat \ bool) \ bool" (binder "\\<^sup>\" 10) where + "\\<^sup>\n. P n \ \n\<^sub>0. \n\n\<^sub>0. P n" + +definition learn_lim :: "partial2 \ (partial1 set) \ partial1 \ bool" where + "learn_lim \ U s \ + environment \ U s \ + (\f\U. \i. \ i = f \ (\\<^sup>\n. s (f \ n) \= i))" + +lemma learn_limE: + assumes "learn_lim \ U s" + shows "environment \ U s" + and "\f. f \ U \ \i. \ i = f \ (\\<^sup>\n. s (f \ n) \= i)" + using assms learn_lim_def by auto + +lemma learn_limI: + assumes "environment \ U s" + and "\f. f \ U \ \i. \ i = f \ (\\<^sup>\n. s (f \ n) \= i)" + shows "learn_lim \ U s" + using assms learn_lim_def by auto + +definition LIM_wrt :: "partial2 \ partial1 set set" where + "LIM_wrt \ \ {U. \s. learn_lim \ U s}" + +definition Lim :: "partial1 set set" ("LIM") where + "LIM \ {U. \\ s. learn_lim \ U s}" + +text \LIM is closed under the the subset relation.\ + +lemma learn_lim_closed_subseteq: + assumes "learn_lim \ U s" and "V \ U" + shows "learn_lim \ V s" + using assms learn_lim_def by auto + +corollary LIM_closed_subseteq: + assumes "U \ LIM" and "V \ U" + shows "V \ LIM" + using assms learn_lim_closed_subseteq by (smt Lim_def mem_Collect_eq) + +text \Changing the hypothesis infinitely often precludes learning in +the limit.\ + +lemma infinite_hyp_changes_not_Lim: + assumes "f \ U" and "\n. \m\<^sub>1>n. \m\<^sub>2>n. s (f \ m\<^sub>1) \ s (f \ m\<^sub>2)" + shows "\ learn_lim \ U s" + using assms learn_lim_def by (metis less_imp_le) + +lemma always_hyp_change_not_Lim: + assumes "\x. s (f \ (Suc x)) \ s (f \ x)" + shows "\ learn_lim \ {f} s" + using assms learn_limE by (metis le_SucI order_refl singletonI) + +text \Guessing a wrong hypothesis infinitely often precludes learning +in the limit.\ + +lemma infinite_hyp_wrong_not_Lim: + assumes "f \ U" and "\n. \m>n. \ (the (s (f \ m))) \ f" + shows "\ learn_lim \ U s" + using assms learn_limE by (metis less_imp_le option.sel) + +text \Converging to the same hypothesis on two functions precludes +learning in the limit.\ + +lemma same_hyp_for_two_not_Lim: + assumes "f\<^sub>1 \ U" + and "f\<^sub>2 \ U" + and "f\<^sub>1 \ f\<^sub>2" + and "\n\n\<^sub>1. s (f\<^sub>1 \ n) = h" + and "\n\n\<^sub>2. s (f\<^sub>2 \ n) = h" + shows "\ learn_lim \ U s" + using assms learn_limE by (metis le_cases option.sel) + +text \Every class that can be learned in the limit can be learned in +the limit with respect to any Gödel numbering. We prove a generalization in +which hypotheses may have to satisfy an extra condition, so we can re-use it +for other inference types later.\ + +lemma learn_lim_extra_wrt_goedel: + fixes extra :: "(partial1 set) \ partial1 \ nat \ partial1 \ bool" + assumes "goedel_numbering \" + and "learn_lim \ U s" + and "\f n. f \ U \ extra U f n (\ (the (s (f \ n))))" + shows "\t. learn_lim \ U t \ (\f\U. \n. extra U f n (\ (the (t (f \ n)))))" +proof - + have env: "environment \ U s" + and lim: "learn_lim \ U s" + and extra: "\f\U. \n. extra U f n (\ (the (s (f \ n))))" + using assms learn_limE by auto + obtain c where c: "c \ \" "\i. \ i = \ (the (c i))" + using env goedel_numberingE[OF assms(1), of \] by auto + define t where "t \ + (\x. if s x \ \ c (the (s x)) \ then Some (the (c (the (s x)))) else None)" + have "t \ \
" + unfolding t_def using env c concat_P1_P1[of c s] by auto + have "t x = (if s x \ then Some (the (c (the (s x)))) else None)" for x + using t_def c(1) R1_imp_total1 by auto + then have t: "t (f \ n) \= the (c (the (s (f \ n))))" if "f \ U" for f n + using lim learn_limE that by simp + have "learn_lim \ U t" + proof (rule learn_limI) + show "environment \ U t" + using t by (simp add: \t \ \
\ env goedel_numbering_P2[OF assms(1)]) + show "\i. \ i = f \ (\\<^sup>\n. t (f \ n) \= i)" if "f \ U" for f + proof - + from lim learn_limE(2) obtain i n\<^sub>0 where + i: "\ i = f \ (\n\n\<^sub>0. s (f \ n) \= i)" + using \f \ U\ by blast + let ?j = "the (c i)" + have "\ ?j = f" + using c(2) i by simp + moreover have "t (f \ n) \= ?j" if "n \ n\<^sub>0" for n + by (simp add: \f \ U\ i t that) + ultimately show ?thesis by auto + qed + qed + moreover have "extra U f n (\ (the (t (f \ n))))" if "f \ U" for f n + proof - + from t have "the (t (f \ n)) = the (c (the (s (f \ n))))" + by (simp add: that) + then have "\ (the (t (f \ n))) = \ (the (s (f \ n)))" + using c(2) by simp + with extra show ?thesis using that by simp + qed + ultimately show ?thesis by auto +qed + +lemma learn_lim_wrt_goedel: + assumes "goedel_numbering \" and "learn_lim \ U s" + shows "\t. learn_lim \ U t" + using assms learn_lim_extra_wrt_goedel[where ?extra="\U f n h. True"] + by simp + +lemma LIM_wrt_phi_eq_Lim: "LIM_wrt \ = LIM" + using LIM_wrt_def Lim_def learn_lim_wrt_goedel[OF goedel_numbering_phi] + by blast + + +subsection \BC: Behaviorally correct learning in the limit\ + +text \Behaviorally correct learning in the limit relaxes LIM by +requiring that the strategy almost always output an index for the target +function, but not necessarily the same index. In other words convergence of +$(S(f^n))_{n\in\mathbb{N}}$ is replaced by convergence of +$(\psi_{S(f^n)})_{n\in\mathbb{N}}$.\ + +definition learn_bc :: "partial2 \ (partial1 set) \ partial1 \ bool" where + "learn_bc \ U s \ + environment \ U s \ + (\f\U. \\<^sup>\n. \ (the (s (f \ n))) = f)" + +lemma learn_bcE: + assumes "learn_bc \ U s" + shows "environment \ U s" + and "\f. f \ U \ \\<^sup>\n. \ (the (s (f \ n))) = f" + using assms learn_bc_def by auto + +lemma learn_bcI: + assumes "environment \ U s" + and "\f. f \ U \ \\<^sup>\n. \ (the (s (f \ n))) = f" + shows "learn_bc \ U s" + using assms learn_bc_def by auto + +definition BC_wrt :: "partial2 \ partial1 set set" where + "BC_wrt \ \ {U. \s. learn_bc \ U s}" + +definition BC :: "partial1 set set" where + "BC \ {U. \\ s. learn_bc \ U s}" + +text \BC is a superset of LIM and closed under the subset relation.\ + +lemma learn_lim_imp_BC: "learn_lim \ U s \ learn_bc \ U s" + using learn_limE learn_bcI[of \ U s] by fastforce + +lemma Lim_subseteq_BC: "LIM \ BC" + using learn_lim_imp_BC Lim_def BC_def by blast + +lemma learn_bc_closed_subseteq: + assumes "learn_bc \ U s" and "V \ U" + shows "learn_bc \ V s" + using assms learn_bc_def by auto + +corollary BC_closed_subseteq: + assumes "U \ BC" and "V \ U" + shows "V \ BC" + using assms by (smt BC_def learn_bc_closed_subseteq mem_Collect_eq) + +text \Just like with LIM, guessing a wrong hypothesis infinitely often +precludes BC-style learning.\ + +lemma infinite_hyp_wrong_not_BC: + assumes "f \ U" and "\n. \m>n. \ (the (s (f \ m))) \ f" + shows "\ learn_bc \ U s" +proof + assume "learn_bc \ U s" + then obtain n\<^sub>0 where "\n\n\<^sub>0. \ (the (s (f \ n))) = f" + using learn_bcE assms(1) by metis + with assms(2) show False using less_imp_le by blast +qed + +text \The proof that Gödel numberings suffice as hypothesis spaces for +BC is similar to the one for @{thm[source] learn_lim_extra_wrt_goedel}. We do +not need the @{term extra} part for BC, but we get it for free.\ + +lemma learn_bc_extra_wrt_goedel: + fixes extra :: "(partial1 set) \ partial1 \ nat \ partial1 \ bool" + assumes "goedel_numbering \" + and "learn_bc \ U s" + and "\f n. 
f \ U \ extra U f n (\ (the (s (f \ n))))" + shows "\t. learn_bc \ U t \ (\f\U. \n. extra U f n (\ (the (t (f \ n)))))" +proof - + have env: "environment \ U s" + and lim: "learn_bc \ U s" + and extra: "\f\U. \n. extra U f n (\ (the (s (f \ n))))" + using assms learn_bc_def by auto + obtain c where c: "c \ \" "\i. \ i = \ (the (c i))" + using env goedel_numberingE[OF assms(1), of \] by auto + define t where + "t = (\x. if s x \ \ c (the (s x)) \ then Some (the (c (the (s x)))) else None)" + have "t \ \
" + unfolding t_def using env c concat_P1_P1[of c s] by auto + have "t x = (if s x \ then Some (the (c (the (s x)))) else None)" for x + using t_def c(1) R1_imp_total1 by auto + then have t: "t (f \ n) \= the (c (the (s (f \ n))))" if "f \ U" for f n + using lim learn_bcE(1) that by simp + have "learn_bc \ U t" + proof (rule learn_bcI) + show "environment \ U t" + using t by (simp add: \t \ \
\ env goedel_numbering_P2[OF assms(1)]) + show "\\<^sup>\n. \ (the (t (f \ n))) = f" if "f \ U" for f + proof - + obtain n\<^sub>0 where "\n\n\<^sub>0. \ (the (s (f \ n))) = f" + using lim learn_bcE(2) \f \ U\ by blast + then show ?thesis using that t c(2) by auto + qed + qed + moreover have "extra U f n (\ (the (t (f \ n))))" if "f \ U" for f n + proof - + from t have "the (t (f \ n)) = the (c (the (s (f \ n))))" + by (simp add: that) + then have "\ (the (t (f \ n))) = \ (the (s (f \ n)))" + using c(2) by simp + with extra show ?thesis using that by simp + qed + ultimately show ?thesis by auto +qed + +corollary learn_bc_wrt_goedel: + assumes "goedel_numbering \" and "learn_bc \ U s" + shows "\t. learn_bc \ U t" + using assms learn_bc_extra_wrt_goedel[where ?extra="\_ _ _ _. True"] by simp + +corollary BC_wrt_phi_eq_BC: "BC_wrt \ = BC" + using learn_bc_wrt_goedel goedel_numbering_phi BC_def BC_wrt_def by blast + + +subsection \CONS: Learning in the limit with consistent hypotheses\ + +text \A hypothesis is \emph{consistent} if it matches all values in the +prefix given to the strategy. Consistent learning in the limit requires the +strategy to output only consistent hypotheses for prefixes from the class.\ + +definition learn_cons :: "partial2 \ (partial1 set) \ partial1 \ bool" where + "learn_cons \ U s \ + learn_lim \ U s \ + (\f\U. \n. \k\n. \ (the (s (f \ n))) k = f k)" + +definition CONS_wrt :: "partial2 \ partial1 set set" where + "CONS_wrt \ \ {U. \s. learn_cons \ U s}" + +definition CONS :: "partial1 set set" where + "CONS \ {U. \\ s. learn_cons \ U s}" + +lemma CONS_subseteq_Lim: "CONS \ LIM" + using CONS_def Lim_def learn_cons_def by blast + +lemma learn_consI: + assumes "environment \ U s" + and "\f. f \ U \ \i. \ i = f \ (\\<^sup>\n. s (f \ n) \= i)" + and "\f n. f \ U \ \k\n. \ (the (s (f \ n))) k = f k" + shows "learn_cons \ U s" + using assms learn_lim_def learn_cons_def by simp + +text \If a consistent strategy converges, it automatically converges to +a correct hypothesis. Thus we can remove @{term "\ i = f"} from the second +assumption in the previous lemma.\ + +lemma learn_consI2: + assumes "environment \ U s" + and "\f. f \ U \ \i. \\<^sup>\n. s (f \ n) \= i" + and "\f n. f \ U \ \k\n. \ (the (s (f \ n))) k = f k" + shows "learn_cons \ U s" +proof (rule learn_consI) + show "environment \ U s" + and cons: "\f n. f \ U \ \k\n. \ (the (s (f \ n))) k = f k" + using assms by simp_all + show "\i. \ i = f \ (\\<^sup>\n. s (f \ n) \= i)" if "f \ U" for f + proof - + from that assms(2) obtain i n\<^sub>0 where i_n0: "\n\n\<^sub>0. s (f \ n) \= i" + by blast + have "\ i x = f x" for x + proof (cases "x \ n\<^sub>0") + case True + then show ?thesis + using i_n0 cons that by fastforce + next + case False + moreover have "\k\x. \ (the (s (f \ x))) k = f k" + using cons that by simp + ultimately show ?thesis using i_n0 by simp + qed + with i_n0 show ?thesis by auto + qed +qed + +lemma learn_consE: + assumes "learn_cons \ U s" + shows "environment \ U s" + and "\f. f \ U \ \i n\<^sub>0. \ i = f \ (\n\n\<^sub>0. s (f \ n) \= i)" + and "\f n. f \ U \ \k\n. \ (the (s (f \ n))) k = f k" + using assms learn_cons_def learn_lim_def by auto + +lemma learn_cons_wrt_goedel: + assumes "goedel_numbering \" and "learn_cons \ U s" + shows "\t. learn_cons \ U t" + using learn_cons_def assms + learn_lim_extra_wrt_goedel[where ?extra="\U f n h. \k\n. 
h k = f k"] + by auto + +lemma CONS_wrt_phi_eq_CONS: "CONS_wrt \ = CONS" + using CONS_wrt_def CONS_def learn_cons_wrt_goedel goedel_numbering_phi + by blast + +lemma learn_cons_closed_subseteq: + assumes "learn_cons \ U s" and "V \ U" + shows "learn_cons \ V s" + using assms learn_cons_def learn_lim_closed_subseteq by auto + +lemma CONS_closed_subseteq: + assumes "U \ CONS" and "V \ U" + shows "V \ CONS" + using assms learn_cons_closed_subseteq by (smt CONS_def mem_Collect_eq) + +text \A consistent strategy cannot output the same hypothesis for two +different prefixes from the class to be learned.\ + +lemma same_hyp_different_init_not_cons: + assumes "f \ U" + and "g \ U" + and "f \ n \ g \ n" + and "s (f \ n) = s (g \ n)" + shows "\ learn_cons \ U s" + unfolding learn_cons_def by (auto, metis assms init_eqI) + + +subsection \TOTAL: Learning in the limit with total hypotheses\ + +text \Total learning in the limit requires the strategy to hypothesize +only total functions for prefixes from the class.\ + +definition learn_total :: "partial2 \ (partial1 set) \ partial1 \ bool" where + "learn_total \ U s \ + learn_lim \ U s \ + (\f\U. \n. \ (the (s (f \ n))) \ \)" + +definition TOTAL_wrt :: "partial2 \ partial1 set set" where + "TOTAL_wrt \ \ {U. \s. learn_total \ U s}" + +definition TOTAL :: "partial1 set set" where + "TOTAL \ {U. \\ s. learn_total \ U s}" + +lemma TOTAL_subseteq_LIM: "TOTAL \ LIM" + unfolding TOTAL_def Lim_def using learn_total_def by auto + +lemma learn_totalI: + assumes "environment \ U s" + and "\f. f \ U \ \i. \ i = f \ (\\<^sup>\n. s (f \ n) \= i)" + and "\f n. f \ U \ \ (the (s (f \ n))) \ \" + shows "learn_total \ U s" + using assms learn_lim_def learn_total_def by auto + +lemma learn_totalE: + assumes "learn_total \ U s" + shows "environment \ U s" + and "\f. f \ U \ \i n\<^sub>0. \ i = f \ (\n\n\<^sub>0. s (f \ n) \= i)" + and "\f n. f \ U \ \ (the (s (f \ n))) \ \" + using assms learn_lim_def learn_total_def by auto + +lemma learn_total_wrt_goedel: + assumes "goedel_numbering \" and "learn_total \ U s" + shows "\t. learn_total \ U t" + using learn_total_def assms learn_lim_extra_wrt_goedel[where ?extra="\U f n h. h \ \"] + by auto + +lemma TOTAL_wrt_phi_eq_TOTAL: "TOTAL_wrt \ = TOTAL" + using TOTAL_wrt_def TOTAL_def learn_total_wrt_goedel goedel_numbering_phi + by blast + +lemma learn_total_closed_subseteq: + assumes "learn_total \ U s" and "V \ U" + shows "learn_total \ V s" + using assms learn_total_def learn_lim_closed_subseteq by auto + +lemma TOTAL_closed_subseteq: + assumes "U \ TOTAL" and "V \ U" + shows "V \ TOTAL" + using assms learn_total_closed_subseteq by (smt TOTAL_def mem_Collect_eq) + + +subsection \CP: Learning in the limit with class-preserving hypotheses\ + +text \Class-preserving learning in the limit requires all hypotheses +for prefixes from the class to be functions from the class.\ + +definition learn_cp :: "partial2 \ (partial1 set) \ partial1 \ bool" where + "learn_cp \ U s \ + learn_lim \ U s \ + (\f\U. \n. \ (the (s (f \ n))) \ U)" + +definition CP_wrt :: "partial2 \ partial1 set set" where + "CP_wrt \ \ {U. \s. learn_cp \ U s}" + +definition CP :: "partial1 set set" where + "CP \ {U. \\ s. learn_cp \ U s}" + +lemma learn_cp_wrt_goedel: + assumes "goedel_numbering \" and "learn_cp \ U s" + shows "\t. learn_cp \ U t" + using learn_cp_def assms learn_lim_extra_wrt_goedel[where ?extra="\U f n h. 
h \ U"] + by auto + +corollary CP_wrt_phi: "CP = CP_wrt \" + using learn_cp_wrt_goedel[OF goedel_numbering_phi] + by (smt CP_def CP_wrt_def Collect_cong) + +lemma learn_cpI: + assumes "environment \ U s" + and "\f. f \ U \ \i. \ i = f \ (\\<^sup>\n. s (f \ n) \= i)" + and "\f n. f \ U \ \ (the (s (f \ n))) \ U" + shows "learn_cp \ U s" + using assms learn_cp_def learn_lim_def by auto + +lemma learn_cpE: + assumes "learn_cp \ U s" + shows "environment \ U s" + and "\f. f \ U \ \i n\<^sub>0. \ i = f \ (\n\n\<^sub>0. s (f \ n) \= i)" + and "\f n. f \ U \ \ (the (s (f \ n))) \ U" + using assms learn_lim_def learn_cp_def by auto + +text \Since classes contain only total functions, a CP strategy is also +a TOTAL strategy.\ + +lemma learn_cp_imp_total: "learn_cp \ U s \ learn_total \ U s" + using learn_cp_def learn_total_def learn_lim_def by auto + +lemma CP_subseteq_TOTAL: "CP \ TOTAL" + using learn_cp_imp_total CP_def TOTAL_def by blast + + +subsection \FIN: Finite learning\ + +text \In general it is undecidable whether a LIM strategy has reached +its final hypothesis. By contrast, in finite learning (also called ``one-shot +learning'') the strategy signals when it is ready to output a hypothesis. Up +until then it outputs a ``don't know yet'' value. This value is represented +by zero and the actual hypothesis $i$ by $i + 1$.\ + +definition learn_fin :: "partial2 \ partial1 set \ partial1 \ bool" where + "learn_fin \ U s \ + environment \ U s \ + (\f \ U. \i n\<^sub>0. \ i = f \ (\n0. s (f \ n) \= 0) \ (\n\n\<^sub>0. s (f \ n) \= Suc i))" + +definition FIN_wrt :: "partial2 \ partial1 set set" where + "FIN_wrt \ \ {U. \s. learn_fin \ U s}" + +definition FIN :: "partial1 set set" where + "FIN \ {U. \\ s. learn_fin \ U s}" + +lemma learn_finI: + assumes "environment \ U s" + and "\f. f \ U \ + \i n\<^sub>0. \ i = f \ (\n0. s (f \ n) \= 0) \ (\n\n\<^sub>0. s (f \ n) \= Suc i)" + shows "learn_fin \ U s" + using assms learn_fin_def by auto + +lemma learn_finE: + assumes "learn_fin \ U s" + shows "environment \ U s" + and "\f. f \ U \ + \i n\<^sub>0. \ i = f \ (\n0. s (f \ n) \= 0) \ (\n\n\<^sub>0. s (f \ n) \= Suc i)" + using assms learn_fin_def by auto + +lemma learn_fin_closed_subseteq: + assumes "learn_fin \ U s" and "V \ U" + shows "learn_fin \ V s" + using assms learn_fin_def by auto + +lemma learn_fin_wrt_goedel: + assumes "goedel_numbering \" and "learn_fin \ U s" + shows "\t. learn_fin \ U t" +proof - + have env: "environment \ U s" + and fin: "\f. f \ U \ + \i n\<^sub>0. \ i = f \ (\n0. s (f \ n) \= 0) \ (\n\n\<^sub>0. s (f \ n) \= Suc i)" + using assms(2) learn_finE by auto + obtain c where c: "c \ \" "\i. \ i = \ (the (c i))" + using env goedel_numberingE[OF assms(1), of \] by auto + define t where "t \ + \x. if s x \ then None + else if s x = Some 0 then Some 0 + else Some (Suc (the (c (the (s x) - 1))))" + have "t \ \
" + proof - + from c obtain rc where rc: + "recfn 1 rc" + "total rc" + "\x. c x = eval rc [x]" + by auto + from env obtain rs where rs: "recfn 1 rs" "\x. s x = eval rs [x]" + by auto + then have "eval rs [f \ n] \" if "f \ U" for f n + using env that by simp + define rt where "rt = Cn 1 r_ifz [rs, Z, Cn 1 S [Cn 1 rc [Cn 1 r_dec [rs]]]]" + then have "recfn 1 rt" + using rc(1) rs(1) by simp + have "eval rt [x] \" if "eval rs [x] \" for x + using rc(1) rs(1) rt_def that by auto + moreover have "eval rt [x] \= 0" if "eval rs [x] \= 0" for x + using rt_def that rc(1,2) rs(1) by simp + moreover have "eval rt [x] \= Suc (the (c (the (s x) - 1)))" if "eval rs [x] \\ 0" for x + using rt_def that rc rs by auto + ultimately have "eval rt [x] = t x" for x + by (simp add: rs(2) t_def) + with `recfn 1 rt` show ?thesis by auto + qed + have t: "t (f \ n) \= + (if s (f \ n) = Some 0 then 0 else Suc (the (c (the (s (f \ n)) - 1))))" + if "f \ U" for f n + using that env by (simp add: t_def) + have "learn_fin \ U t" + proof (rule learn_finI) + show "environment \ U t" + using t by (simp add: \t \ \
\ env goedel_numbering_P2[OF assms(1)]) + show "\i n\<^sub>0. \ i = f \ (\n0. t (f \ n) \= 0) \ (\n\n\<^sub>0. t (f \ n) \= Suc i)" + if "f \ U" for f + proof - + from fin obtain i n\<^sub>0 where + i: "\ i = f \ (\n0. s (f \ n) \= 0) \ (\n\n\<^sub>0. s (f \ n) \= Suc i)" + using \f \ U\ by blast + let ?j = "the (c i)" + have "\ ?j = f" + using c(2) i by simp + moreover have "\n0. t (f \ n) \= 0" + using t[OF that] i by simp + moreover have "t (f \ n) \= Suc ?j" if "n \ n\<^sub>0" for n + using that i t[OF `f \ U`] by simp + ultimately show ?thesis by auto + qed + qed + then show ?thesis by auto +qed + +end \ No newline at end of file diff --git a/thys/Inductive_Inference/LIM_BC.thy b/thys/Inductive_Inference/LIM_BC.thy new file mode 100644 --- /dev/null +++ b/thys/Inductive_Inference/LIM_BC.thy @@ -0,0 +1,1329 @@ +section \LIM is a proper subset of BC\label{s:lim_bc}\ + +theory LIM_BC + imports Lemma_R +begin + +text \The proper inclusion of LIM in BC has been proved by +Barzdin~\cite{b-ttlsf-74} (see also Case and Smith~\cite{cs-cicmii-83}). The +proof constructs a class $V \in \mathrm{BC} - \mathrm{LIM}$ by +diagonalization against all LIM strategies. Exploiting Lemma~R for LIM, we +can assume that all such strategies are total functions. From the effective +version of this lemma we derive a numbering @{term "\ \ +\\<^sup>2"} such that for all $U \in \mathrm{LIM}$ there is an $i$ with +$U\in \mathrm{LIM}_\varphi(\sigma_i)$. The idea behind $V$ +is for every $i$ to construct a class $V_i$ of cardinality one or two such +that $V_i \notin \mathrm{LIM}_\varphi(\sigma_i)$. It then follows that the +union $V := \bigcup_i V_i$ cannot be learned by any $\sigma_i$ and thus $V +\notin \mathrm{LIM}$. At the same time, the construction ensures that the +functions in $V$ are ``predictable enough'' to be learnable in the BC sense. + +At the core is a process that maintains a state $(b, k)$ of a list $b$ of +numbers and an index $k < |b|$ into this list. We imagine $b$ to be the +prefix of the function being constructed, except for position $k$ where +we imagine $b$ to have a ``gap''; that is, $b_k$ is not defined yet. +Technically, we will always have $b_k = 0$, so $b$ also represents the prefix +after the ``gap is filled'' with 0, whereas $b_{k:=1}$ represents the prefix +where the gap is filled with 1. 
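+For illustration of this notation (the concrete values are chosen only as an example and are not tied to any particular $i$): a state $(i100, 2)$ means $b = i100$ and $k = 2$; the prefix before the gap is $i1$, filling the gap with 0 yields $b = i100$ itself, and filling it with 1 yields $b_{k:=1} = i110$.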
For every $i \in \mathbb{N}$, the process +starts in state $(i0, 1)$ and computes the next state from a given state +$(b,k)$ as follows: +\begin{enumerate} +\item if $ \sigma_i(b_{ + + +subsection \Enumerating enough total strategies\ + +text \For the construction of $\sigma$ we need the function @{term +r_limr} from the effective version of Lemma~R for LIM.\ + +definition "r_sigma \ Cn 2 r_phi [Cn 2 r_limr [Id 2 0], Id 2 1]" + +lemma r_sigma_recfn: "recfn 2 r_sigma" + unfolding r_sigma_def using r_limr_recfn by simp + +lemma r_sigma: "eval r_sigma [i, x] = \ (the (eval r_limr [i])) x" + unfolding r_sigma_def phi_def using r_sigma_recfn r_limr_total r_limr_recfn + by simp + +lemma r_sigma_total: "total r_sigma" + using r_sigma r_limr r_sigma_recfn totalI2[of r_sigma] by simp + +abbreviation sigma :: partial2 ("\") where + "\ i x \ eval r_sigma [i, x]" + +lemma sigma: "\ i = \ (the (eval r_limr [i]))" + using r_sigma by simp + +text \The numbering @{term \} does indeed enumerate enough total +strategies for every LIM learning problem.\ + +lemma learn_lim_sigma: + assumes "learn_lim \ U (\ i)" + shows "learn_lim \ U (\ i)" + using assms sigma r_limr by simp + + +subsection \The diagonalization process\ + +text \The following function represents the process described above. It +computes the next state from a given state $(b, k)$.\ + +definition "r_next \ + Cn 1 r_ifeq + [Cn 1 r_sigma [Cn 1 r_hd [r_pdec1], r_pdec1], + Cn 1 r_sigma [Cn 1 r_hd [r_pdec1], Cn 1 r_take [r_pdec2, r_pdec1]], + Cn 1 r_ifeq + [Cn 1 r_sigma [Cn 1 r_hd [r_pdec1], Cn 1 r_update [r_pdec1, r_pdec2, r_const 1]], + Cn 1 r_sigma [Cn 1 r_hd [r_pdec1], Cn 1 r_take [r_pdec2, r_pdec1]], + Cn 1 r_prod_encode [Cn 1 r_snoc [r_pdec1, Z], r_pdec2], + Cn 1 r_prod_encode + [Cn 1 r_snoc + [Cn 1 r_update [r_pdec1, r_pdec2, r_const 1], Z], Cn 1 r_length [r_pdec1]]], + Cn 1 r_prod_encode [Cn 1 r_snoc [r_pdec1, Z], Cn 1 r_length [r_pdec1]]]" + +lemma r_next_recfn: "recfn 1 r_next" + unfolding r_next_def using r_sigma_recfn by simp + +text \The three conditions distinguished in @{term r_next} correspond +to Steps 1, 2, and 3 of the process: hypothesis change when the gap is +filled with 0; hypothesis change when the gap is filled with 1; or +no hypothesis change either way.\ + +abbreviation "change_on_0 b k \ \ (e_hd b) b \ \ (e_hd b) (e_take k b)" + +abbreviation "change_on_1 b k \ + \ (e_hd b) b = \ (e_hd b) (e_take k b) \ + \ (e_hd b) (e_update b k 1) \ \ (e_hd b) (e_take k b)" + +abbreviation "change_on_neither b k \ + \ (e_hd b) b = \ (e_hd b) (e_take k b) \ + \ (e_hd b) (e_update b k 1) = \ (e_hd b) (e_take k b)" + +lemma change_conditions: + obtains + (on_0) "change_on_0 b k" + | (on_1) "change_on_1 b k" + | (neither) "change_on_neither b k" + by auto + +lemma r_next: + assumes "arg = prod_encode (b, k)" + shows "change_on_0 b k \ eval r_next [arg] \= prod_encode (e_snoc b 0, e_length b)" + and "change_on_1 b k \ + eval r_next [arg] \= prod_encode (e_snoc (e_update b k 1) 0, e_length b)" + and "change_on_neither b k \ eval r_next [arg] \= prod_encode (e_snoc b 0, k)" +proof - + let ?bhd = "Cn 1 r_hd [r_pdec1]" + let ?bup = "Cn 1 r_update [r_pdec1, r_pdec2, r_const 1]" + let ?bk = "Cn 1 r_take [r_pdec2, r_pdec1]" + let ?bap = "Cn 1 r_snoc [r_pdec1, Z]" + let ?len = "Cn 1 r_length [r_pdec1]" + let ?thenthen = "Cn 1 r_prod_encode [?bap, r_pdec2]" + let ?thenelse = "Cn 1 r_prod_encode [Cn 1 r_snoc [?bup, Z], ?len]" + let ?else = "Cn 1 r_prod_encode [?bap, ?len]" + have bhd: "eval ?bhd [arg] \= e_hd b" + using assms by simp + have bup: "eval 
?bup [arg] \= e_update b k 1" + using assms by simp + have bk: "eval ?bk [arg] \= e_take k b" + using assms by simp + have bap: "eval ?bap [arg] \= e_snoc b 0" + using assms by simp + have len: "eval ?len [arg] \= e_length b" + using assms by simp + have else_: "eval ?else [arg] \= prod_encode (e_snoc b 0, e_length b)" + using bap len by simp + have thenthen: "eval ?thenthen [arg] \= prod_encode (e_snoc b 0, k)" + using bap assms by simp + have thenelse: "eval ?thenelse [arg] \= prod_encode (e_snoc (e_update b k 1) 0, e_length b)" + using bup len by simp + have then_: + "eval + (Cn 1 r_ifeq [Cn 1 r_sigma [?bhd, ?bup], Cn 1 r_sigma [?bhd, ?bk], ?thenthen, ?thenelse]) + [arg] \= + (if the (\ (e_hd b) (e_update b k 1)) = the (\ (e_hd b) (e_take k b)) + then prod_encode (e_snoc b 0, k) + else prod_encode (e_snoc (e_update b k 1) 0, e_length b))" + (is "eval ?then [arg] \= ?then_eval") + using bhd bup bk thenthen thenelse r_sigma r_sigma_recfn r_limr R1_imp_total1 by simp + have *: "eval r_next [arg] \= + (if the (\ (e_hd b) b) = the (\ (e_hd b) (e_take k b)) + then ?then_eval + else prod_encode (e_snoc b 0, e_length b))" + unfolding r_next_def + using bhd bk then_ else_ r_sigma r_sigma_recfn r_limr R1_imp_total1 assms + by simp + have r_sigma_neq: "eval r_sigma [x\<^sub>1, y\<^sub>1] \ eval r_sigma [x\<^sub>2, y\<^sub>2] \ + the (eval r_sigma [x\<^sub>1, y\<^sub>1]) \ the (eval r_sigma [x\<^sub>2, y\<^sub>2])" + for x\<^sub>1 y\<^sub>1 x\<^sub>2 y\<^sub>2 + using r_sigma r_limr totalE[OF r_sigma_total r_sigma_recfn] r_sigma_recfn r_sigma_total + by (metis One_nat_def Suc_1 length_Cons list.size(3) option.expand) + { + assume "change_on_0 b k" + then show "eval r_next [arg] \= prod_encode (e_snoc b 0, e_length b)" + using * r_sigma_neq by simp + next + assume "change_on_1 b k" + then show "eval r_next [arg] \= prod_encode (e_snoc (e_update b k 1) 0, e_length b)" + using * r_sigma_neq by simp + next + assume "change_on_neither b k" + then show "eval r_next [arg] \= prod_encode (e_snoc b 0, k)" + using * r_sigma_neq by simp + } +qed + +lemma r_next_total: "total r_next" +proof (rule totalI1) + show "recfn 1 r_next" + using r_next_recfn by simp + show "eval r_next [x] \" for x + proof - + obtain b k where "x = prod_encode (b, k)" + using prod_encode_pdec'[of x] by metis + then show ?thesis using r_next by fast + qed +qed + +text \The next function computes the state of the process after +any number of iterations.\ + +definition "r_state \ + Pr 1 + (Cn 1 r_prod_encode [Cn 1 r_snoc [Cn 1 r_singleton_encode [Id 1 0], Z], r_const 1]) + (Cn 3 r_next [Id 3 1])" + +lemma r_state_recfn: "recfn 2 r_state" + unfolding r_state_def using r_next_recfn by simp + +lemma r_state_at_0: "eval r_state [0, i] \= prod_encode (list_encode [i, 0], 1)" +proof - + let ?f = "Cn 1 r_prod_encode [Cn 1 r_snoc [Cn 1 r_singleton_encode [Id 1 0], Z], r_const 1]" + have "eval r_state [0, i] = eval ?f [i]" + unfolding r_state_def using r_next_recfn by simp + also have "... \= prod_encode (list_encode [i, 0], 1)" + by (simp add: list_decode_singleton) + finally show ?thesis . 
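+  (* hence at iteration 0 the process for i is in state ([i, 0], 1), i.e. block [i, 0] with the gap at position 1 *)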
+qed + +lemma r_state_total: "total r_state" + unfolding r_state_def + using r_next_recfn totalE[OF r_next_total r_next_recfn] totalI3[of "Cn 3 r_next [Id 3 1]"] + by (intro Pr_total) auto + +text \We call the components of a state $(b, k)$ the \emph{block} $b$ +and the \emph{gap} $k$.\ + +definition block :: "nat \ nat \ nat" where + "block i t \ pdec1 (the (eval r_state [t, i]))" + +definition gap :: "nat \ nat \ nat" where + "gap i t \ pdec2 (the (eval r_state [t, i]))" + +lemma state_at_0: + "block i 0 = list_encode [i, 0]" + "gap i 0 = 1" + unfolding block_def gap_def r_state_at_0 by simp_all + +text \Some lemmas describing the behavior of blocks and gaps in +one iteration of the process:\ + +lemma state_Suc: + assumes "b = block i t" and "k = gap i t" + shows "block i (Suc t) = pdec1 (the (eval r_next [prod_encode (b, k)]))" + and "gap i (Suc t) = pdec2 (the (eval r_next [prod_encode (b, k)]))" +proof - + have "eval r_state [Suc t, i] = + eval (Cn 3 r_next [Id 3 1]) [t, the (eval r_state [t, i]), i]" + using r_state_recfn r_next_recfn totalE[OF r_state_total r_state_recfn, of "[t, i]"] + by (simp add: r_state_def) + also have "... = eval r_next [the (eval r_state [t, i])]" + using r_next_recfn by simp + also have "... = eval r_next [prod_encode (b, k)]" + using assms block_def gap_def by simp + finally have "eval r_state [Suc t, i] = eval r_next [prod_encode (b, k)]" . + then show + "block i (Suc t) = pdec1 (the (eval r_next [prod_encode (b, k)]))" + "gap i (Suc t) = pdec2 (the (eval r_next [prod_encode (b, k)]))" + by (simp add: block_def, simp add: gap_def) +qed + +lemma gap_Suc: + assumes "b = block i t" and "k = gap i t" + shows "change_on_0 b k \ gap i (Suc t) = e_length b" + and "change_on_1 b k \ gap i (Suc t) = e_length b" + and "change_on_neither b k\ gap i (Suc t) = k" + using assms r_next state_Suc by simp_all + +lemma block_Suc: + assumes "b = block i t" and "k = gap i t" + shows "change_on_0 b k \ block i (Suc t) = e_snoc b 0" + and "change_on_1 b k \ block i (Suc t) = e_snoc (e_update b k 1) 0" + and "change_on_neither b k\ block i (Suc t) = e_snoc b 0" + using assms r_next state_Suc by simp_all + +text \Non-gap positions in the block remain unchanged after an +iteration.\ + +lemma block_stable: + assumes "j < e_length (block i t)" and "j \ gap i t" + shows "e_nth (block i t) j = e_nth (block i (Suc t)) j" +proof - + from change_conditions[of "block i t" "gap i t"] show ?thesis + using assms block_Suc gap_Suc + by (cases, (simp_all add: nth_append)) +qed + +text \Next are some properties of @{term block} and @{term gap}.\ + +lemma gap_in_block: "gap i t < e_length (block i t)" +proof (induction t) + case 0 + then show ?case by (simp add: state_at_0) +next + case (Suc t) + with change_conditions[of "block i t" "gap i t"] show ?case + proof (cases) + case on_0 + then show ?thesis by (simp add: block_Suc(1) gap_Suc(1)) + next + case on_1 + then show ?thesis by (simp add: block_Suc(2) gap_Suc(2)) + next + case neither + then show ?thesis using Suc.IH block_Suc(3) gap_Suc(3) by force + qed +qed + +lemma length_block: "e_length (block i t) = Suc (Suc t)" +proof (induction t) + case 0 + then show ?case by (simp add: state_at_0) +next + case (Suc t) + with change_conditions[of "block i t" "gap i t"] show ?case + by (cases, simp_all add: block_Suc gap_Suc) +qed + +lemma gap_gr0: "gap i t > 0" +proof (induction t) + case 0 + then show ?case by (simp add: state_at_0) +next + case (Suc t) + with change_conditions[of "block i t" "gap i t"] show ?case + using length_block by (cases, 
simp_all add: block_Suc gap_Suc) +qed + +lemma hd_block: "e_hd (block i t) = i" +proof (induction t) + case 0 + then show ?case by (simp add: state_at_0) +next + case (Suc t) + from change_conditions[of "block i t" "gap i t"] show ?case + proof (cases) + case on_0 + then show ?thesis + using Suc block_Suc(1) length_block by (metis e_hd_snoc gap_Suc(1) gap_gr0) + next + case on_1 + let ?b = "block i t" and ?k = "gap i t" + have "?k > 0" + using gap_gr0 Suc by simp + then have "e_nth (e_update ?b ?k 1) 0 = e_nth ?b 0" + by simp + then have *: "e_hd (e_update ?b ?k 1) = e_hd ?b" + using e_hd_nth0 gap_Suc(2)[of _ i t] gap_gr0 on_1 by (metis e_length_update) + from on_1 have "block i (Suc t) = e_snoc (e_update ?b ?k 1) 0" + by (simp add: block_Suc(2)) + then show ?thesis + using e_hd_0 e_hd_snoc Suc length_block `?k > 0` * + by (metis e_length_update gap_Suc(2) gap_gr0 on_1) + next + case neither + then show ?thesis using Suc block_Suc(3) length_block by simp + qed +qed + +text \Formally, a block always ends in zero, even if it ends in a gap.\ + +lemma last_block: "e_nth (block i t) (gap i t) = 0" +proof (induction t) + case 0 + then show ?case by (simp add: state_at_0) +next + case (Suc t) + from change_conditions[of "block i t" "gap i t"] show ?case + proof cases + case on_0 + then show ?thesis using Suc by (simp add: block_Suc(1) gap_Suc(1)) + next + case on_1 + then show ?thesis using Suc by (simp add: block_Suc(2) gap_Suc(2) nth_append) + next + case neither + then have + "block i (Suc t) = e_snoc (block i t) 0" + "gap i (Suc t) = gap i t" + by (simp_all add: gap_Suc(3) block_Suc(3)) + then show ?thesis + using Suc gap_in_block by (simp add: nth_append) + qed +qed + +lemma gap_le_Suc: "gap i t \ gap i (Suc t)" + using change_conditions[of "block i t" "gap i t"] + gap_Suc gap_in_block less_imp_le[of "gap i t" "e_length (block i t)"] + by (cases) simp_all + +lemma gap_monotone: + assumes "t\<^sub>1 \ t\<^sub>2" + shows "gap i t\<^sub>1 \ gap i t\<^sub>2" +proof - + have "gap i t\<^sub>1 \ gap i (t\<^sub>1 + j)" for j + proof (induction j) + case 0 + then show ?case by simp + next + case (Suc j) + then show ?case using gap_le_Suc dual_order.trans by fastforce + qed + then show ?thesis using assms le_Suc_ex by blast +qed + +text \We need some lemmas relating the shape of the next state +to the hypothesis change conditions in Steps 1, 2, and 3.\ + +lemma state_change_on_neither: + assumes "gap i (Suc t) = gap i t" + shows "change_on_neither (block i t) (gap i t)" + and "block i (Suc t) = e_snoc (block i t) 0" +proof - + let ?b = "block i t" and ?k = "gap i t" + have "?k < e_length ?b" + using gap_in_block by simp + from change_conditions[of ?b ?k] show "change_on_neither (block i t) (gap i t)" + proof (cases) + case on_0 + then show ?thesis + using \?k < e_length ?b\ assms gap_Suc(1) by auto + next + case on_1 + then show ?thesis using assms gap_Suc(2) by auto + next + case neither + then show ?thesis by simp + qed + then show "block i (Suc t) = e_snoc (block i t) 0" + using block_Suc(3) by simp +qed + +lemma state_change_on_either: + assumes "gap i (Suc t) \ gap i t" + shows "\ change_on_neither (block i t) (gap i t)" + and "gap i (Suc t) = e_length (block i t)" +proof - + let ?b = "block i t" and ?k = "gap i t" + show "\ change_on_neither (block i t) (gap i t)" + proof + assume "change_on_neither (block i t) (gap i t)" + then have "gap i (Suc t) = ?k" + by (simp add: gap_Suc(3)) + with assms show False by simp + qed + then show "gap i (Suc t) = e_length (block i t)" + using gap_Suc(1) 
gap_Suc(2) by blast +qed + +text \Next up is the definition of $\tau$. In every iteration the +process determines $\tau_i(x)$ for some $x$ either by appending 0 to the +current block $b$, or by filling the current gap $k$. In the former case, +the value is determined for $x = |b|$, in the latter for $x = k$.\ + +text \For $i$ and $x$ the function @{term r_dettime} computes in which +iteration the process for $i$ determines the value $\tau_i(x)$. This is the +first iteration in which the block is long enough to contain position $x$ and +in which $x$ is not the gap. If $\tau_i(x)$ is never determined, because Case~2 is +reached with $k = x$, then @{term r_dettime} diverges.\ + +abbreviation determined :: "nat \ nat \ bool" where + "determined i x \ \t. x < e_length (block i t) \ x \ gap i t" + +lemma determined_0: "determined i 0" + using gap_gr0[of i 0] gap_in_block[of i 0] by force + +definition "r_dettime \ + Mn 2 + (Cn 3 r_and + [Cn 3 r_less + [Id 3 2, Cn 3 r_length [Cn 3 r_pdec1 [Cn 3 r_state [Id 3 0, Id 3 1]]]], + Cn 3 r_neq + [Id 3 2, Cn 3 r_pdec2 [Cn 3 r_state [Id 3 0, Id 3 1]]]])" + +lemma r_dettime_recfn: "recfn 2 r_dettime" + unfolding r_dettime_def using r_state_recfn by simp + +abbreviation dettime :: partial2 where + "dettime i x \ eval r_dettime [i, x]" + +lemma r_dettime: + shows "determined i x \ dettime i x \= (LEAST t. x < e_length (block i t) \ x \ gap i t)" + and "\ determined i x \ dettime i x \" +proof - + define f where "f = + (Cn 3 r_and + [Cn 3 r_less + [Id 3 2, Cn 3 r_length [Cn 3 r_pdec1 [Cn 3 r_state [Id 3 0, Id 3 1]]]], + Cn 3 r_neq + [Id 3 2, Cn 3 r_pdec2 [Cn 3 r_state [Id 3 0, Id 3 1]]]])" + then have "r_dettime = Mn 2 f" + unfolding f_def r_dettime_def by simp + have "recfn 3 f" + unfolding f_def using r_state_recfn by simp + then have "total f" + unfolding f_def using Cn_total r_state_total Mn_free_imp_total by simp + have f: "eval f [t, i, x] \= (if x < e_length (block i t) \ x \ gap i t then 0 else 1)" for t + proof - + let ?b = "Cn 3 r_pdec1 [Cn 3 r_state [Id 3 0, Id 3 1]]" + let ?k = "Cn 3 r_pdec2 [Cn 3 r_state [Id 3 0, Id 3 1]]" + have "eval ?b [t, i, x] \= pdec1 (the (eval r_state [t, i]))" + using r_state_recfn r_state_total by simp + then have b: "eval ?b [t, i, x] \= block i t" + using block_def by simp + have "eval ?k [t, i, x] \= pdec2 (the (eval r_state [t, i]))" + using r_state_recfn r_state_total by simp + then have k: "eval ?k [t, i, x] \= gap i t" + using gap_def by simp + have "eval + (Cn 3 r_neq [Id 3 2, Cn 3 r_pdec2 [Cn 3 r_state [Id 3 0, Id 3 1]]]) + [t, i, x] \= + (if x \ gap i t then 0 else 1)" + using b k r_state_recfn r_state_total by simp + moreover have "eval + (Cn 3 r_less + [Id 3 2, Cn 3 r_length [Cn 3 r_pdec1 [Cn 3 r_state [Id 3 0, Id 3 1]]]]) + [t, i, x] \= + (if x < e_length (block i t) then 0 else 1)" + using b k r_state_recfn r_state_total by simp + ultimately show ?thesis + unfolding f_def using b k r_state_recfn r_state_total by simp + qed + { + assume "determined i x" + with f have "\t. eval f [t, i, x] \= 0" by simp + then have "dettime i x \= (LEAST t. eval f [t, i, x] \= 0)" + using `total f` `r_dettime = Mn 2 f` r_dettime_recfn `recfn 3 f` + eval_Mn_total[of 2 f "[i, x]"] + by simp + then show "dettime i x \= (LEAST t. x < e_length (block i t) \ x \ gap i t)" + using f by simp + next + assume "\ determined i x" + with f have "\ (\t. 
eval f [t, i, x] \= 0)" by simp + then have "dettime i x \" + using `total f` `r_dettime = Mn 2 f` r_dettime_recfn `recfn 3 f` + eval_Mn_total[of 2 f "[i, x]"] + by simp + with f show "dettime i x \" by simp + } +qed + +lemma r_dettimeI: + assumes "x < e_length (block i t) \ x \ gap i t" + and "\T. x < e_length (block i T) \ x \ gap i T \ t \ T" + shows "dettime i x \= t" +proof - + let ?P = "\T. x < e_length (block i T) \ x \ gap i T" + have "determined i x" + using assms(1) by auto + moreover have "Least ?P = t" + using assms Least_equality[of ?P t] by simp + ultimately show ?thesis using r_dettime by simp +qed + +lemma r_dettime_0: "dettime i 0 \= 0" + using r_dettimeI[of _ i 0] determined_0 gap_gr0[of i 0] gap_in_block[of i 0] + by fastforce + +text \Computing the value of $\tau_i(x)$ works by running the process +@{term r_state} for @{term "dettime i x"} iterations and taking the value at +index $x$ of the resulting block.\ + +definition "r_tau \ Cn 2 r_nth [Cn 2 r_pdec1 [Cn 2 r_state [r_dettime, Id 2 0]], Id 2 1]" + +lemma r_tau_recfn: "recfn 2 r_tau" + unfolding r_tau_def using r_dettime_recfn r_state_recfn by simp + +abbreviation tau :: partial2 ("\") where + "\ i x \ eval r_tau [i, x]" + +lemma tau_in_P2: "\ \ \
\<^sup>2" + using r_tau_recfn by auto + +lemma tau_diverg: + assumes "\ determined i x" + shows "\ i x \" + unfolding r_tau_def using assms r_dettime r_dettime_recfn r_state_recfn by simp + +lemma tau_converg: + assumes "determined i x" + shows "\ i x \= e_nth (block i (the (dettime i x))) x" +proof - + from assms obtain t where t: "dettime i x \= t" + using r_dettime(1) by blast + then have "eval (Cn 2 r_state [r_dettime, Id 2 0]) [i, x] = eval r_state [t, i]" + using r_state_recfn r_dettime_recfn by simp + moreover have "eval r_state [t, i] \" + using r_state_total r_state_recfn by simp + ultimately have "eval (Cn 2 r_pdec1 [Cn 2 r_state [r_dettime, Id 2 0]]) [i, x] = + eval r_pdec1 [the (eval r_state [t, i])]" + using r_state_recfn r_dettime_recfn by simp + then show ?thesis + unfolding r_tau_def using r_state_recfn r_dettime_recfn t block_def by simp +qed + +lemma tau_converg': + assumes "dettime i x \= t" + shows "\ i x \= e_nth (block i t) x" + using assms tau_converg[of x i] r_dettime(2)[of x i] by fastforce + +lemma tau_at_0: "\ i 0 \= i" +proof - + have "\ i 0 \= e_nth (block i 0) 0" + using tau_converg'[OF r_dettime_0] by simp + then show ?thesis using block_def by (simp add: r_state_at_0) +qed + +lemma state_unchanged: + assumes "gap i t - 1 \ y" and "y \ t" + shows "gap i t = gap i y" +proof - + have "gap i t = gap i (gap i t - 1)" + proof (induction t) + case 0 + then show ?case by (simp add: gap_def r_state_at_0) + next + case (Suc t) + show ?case + proof (cases "gap i (Suc t) = t + 2") + case True + then show ?thesis by simp + next + case False + then show ?thesis + using Suc state_change_on_either(2) length_block by force + qed + qed + moreover have "gap i (gap i t - 1) \ gap i y" + using assms(1) gap_monotone by simp + moreover have "gap i y \ gap i t" + using assms(2) gap_monotone by simp + ultimately show ?thesis by simp +qed + +text \The values of the non-gap indices $x$ of every block created in +the diagonalization process equal $\tau_i(x)$.\ + +lemma tau_eq_state: + assumes "j < e_length (block i t)" and "j \ gap i t" + shows "\ i j \= e_nth (block i t) j" + using assms +proof (induction t) + case 0 + then have "j = 0" + using gap_gr0[of i 0] gap_in_block[of i 0] length_block[of i 0] by simp + then have "\ (e_hd (block i t)) j \= e_nth (block i (the (dettime i 0))) 0" + using determined_0 tau_converg hd_block by simp + then have "\ (e_hd (block i t)) j \= e_nth (block i 0) 0" + using r_dettime_0 by simp + then show ?case using \j = 0\ r_dettime_0 tau_converg' by simp +next + case (Suc t) + let ?b = "block i t" + let ?bb = "block i (Suc t)" + let ?k = "gap i t" + let ?kk = "gap i (Suc t)" + show ?case + proof (cases "?kk = ?k") + case kk_eq_k: True + then have bb_b0: "?bb = e_snoc ?b 0" + using state_change_on_neither by simp + show "\ i j \= e_nth ?bb j" + proof (cases "j < e_length ?b") + case True + then have "e_nth ?bb j = e_nth ?b j" + using bb_b0 by (simp add: nth_append) + moreover have "j \ ?k" + using Suc kk_eq_k by simp + ultimately show ?thesis using Suc True by simp + next + case False + then have j: "j = e_length ?b" + using Suc.prems(1) length_block by auto + then have "e_nth ?bb j = 0" + using bb_b0 by simp + have "dettime i j \= Suc t" + proof (rule r_dettimeI) + show "j < e_length ?bb \ j \ ?kk" + using Suc.prems(1,2) by linarith + show "\T. 
j < e_length (block i T) \ j \ gap i T \ Suc t \ T" + using length_block j by simp + qed + with tau_converg' show ?thesis by simp + qed + next + case False + then have kk_lenb: "?kk = e_length ?b" + using state_change_on_either by simp + then show ?thesis + proof (cases "j = ?k") + case j_eq_k: True + have "dettime i j \= Suc t" + proof (rule r_dettimeI) + show "j < e_length ?bb \ j \ ?kk" + using Suc.prems(1,2) by simp + show "Suc t \ T" if "j < e_length (block i T) \ j \ gap i T" for T + proof (rule ccontr) + assume "\ (Suc t \ T)" + then have "T < Suc t" by simp + then show False + proof (cases "T < ?k - 1") + case True + then have "e_length (block i T) = T + 2" + using length_block by simp + then have "e_length (block i T) < ?k + 1" + using True by simp + then have "e_length (block i T) \ ?k" by simp + then have "e_length (block i T) \ j" + using j_eq_k by simp + then show False + using that by simp + next + case False + then have "?k - 1 \ T" and "T \ t" + using `T < Suc t` by simp_all + with state_unchanged have "gap i t = gap i T" by blast + then show False + using j_eq_k that by simp + qed + qed + qed + then show ?thesis using tau_converg' by simp + next + case False + then have "j < e_length ?b" + using kk_lenb Suc.prems(1,2) length_block by auto + then show ?thesis using Suc False block_stable by fastforce + qed + qed +qed + +lemma tau_eq_state': + assumes "j < t + 2" and " j \ gap i t" + shows "\ i j \= e_nth (block i t) j" + using assms tau_eq_state length_block by simp + +text \We now consider the two cases described in the proof sketch. +In Case~2 there is a gap that never gets filled, or equivalently there is +a rightmost gap.\ + +abbreviation "case_two i \ (\t. \T. gap i T \ gap i t)" + +abbreviation "case_one i \ \ case_two i" + +text \Another characterization of Case~2 is that from some iteration on +only @{term change_on_neither} holds.\ + +lemma case_two_iff_forever_neither: + "case_two i \ (\t. \T\t. change_on_neither (block i T) (gap i T))" +proof + assume "\t. \T\t. change_on_neither (block i T) (gap i T)" + then obtain t where t: "\T\t. change_on_neither (block i T) (gap i T)" + by auto + have "(gap i T) \ (gap i t)" for T + proof (cases "T \ t") + case True + then show ?thesis using gap_monotone by simp + next + case False + then show ?thesis + proof (induction T) + case 0 + then show ?case by simp + next + case (Suc T) + with t have "change_on_neither ((block i T)) ((gap i T))" + by simp + then show ?case + using Suc.IH state_change_on_either(1)[of i T] gap_monotone[of T t i] + by metis + qed + qed + then show "\t. \T. gap i T \ gap i t" + by auto +next + assume "\t. \T. gap i T \ gap i t" + then obtain t where t: "\T. gap i T \ gap i t" + by auto + have "change_on_neither (block i T) (gap i T)" if "T\t" for T + proof - + have T: "(gap i T) \ (gap i t)" + using gap_monotone that by simp + show ?thesis + proof (rule ccontr) + assume "\ change_on_neither (block i T) (gap i T)" + then have "change_on_0 (block i T) (gap i T) \ change_on_1 (block i T) (gap i T)" + by simp + then have "gap i (Suc T) > gap i T" + using gap_le_Suc[of i] state_change_on_either(2)[of i] state_change_on_neither(1)[of i] + dual_order.strict_iff_order + by blast + with T have "gap i (Suc T) > gap i t" by simp + with t show False + using not_le by auto + qed + qed + then show "\t. \T\t. 
change_on_neither (block i T) (gap i T)" + by auto +qed + +text \In Case~1, $\tau_i$ is total.\ + +lemma case_one_tau_total: + assumes "case_one i" + shows "\ i x \" +proof (cases "x = gap i x") + case True + from assms have "\t. \T. gap i T > gap i t" + using le_less_linear gap_def[of i x] by blast + then obtain T where T: "gap i T > gap i x" + by auto + then have "T > x" + using gap_monotone leD le_less_linear by blast + then have "x < T + 2" by simp + moreover from T True have "x \ gap i T" by simp + ultimately show ?thesis using tau_eq_state' by simp +next + case False + moreover have "x < x + 2" by simp + ultimately show ?thesis using tau_eq_state' by blast +qed + +text \In Case~2, $\tau_i$ is undefined only at the gap that never gets filled.\ + +lemma case_two_tau_not_quite_total: + assumes "\T. gap i T \ gap i t" + shows "\ i (gap i t) \" + and "x \ gap i t \ \ i x \" +proof - + let ?k = "gap i t" + have "\ determined i ?k" + proof + assume "determined i ?k" + then obtain T where T: "?k < e_length (block i T) \ ?k \ gap i T" + by auto + with assms have snd_le: "gap i T < ?k" + by (simp add: dual_order.strict_iff_order) + then have "T < t" + using gap_monotone by (metis leD le_less_linear) + from T length_block have "?k < T + 2" by simp + moreover have "?k \ T + 1" + using T state_change_on_either(2) \T < t\ state_unchanged + by (metis Suc_eq_plus1 Suc_leI add_diff_cancel_right' le_add1 nat_neq_iff) + ultimately have "?k \ T" by simp + then have "gap i T = gap i ?k" + using state_unchanged[of i T "?k"] \?k < T + 2\ snd_le by simp + then show False + by (metis diff_le_self state_unchanged leD nat_le_linear gap_monotone snd_le) + qed + with tau_diverg show "\ i ?k \" by simp + + assume "x \ ?k" + show "\ i x \" + proof (cases "x < t + 2") + case True + with `x \ ?k` tau_eq_state' show ?thesis by simp + next + case False + then have "gap i x = ?k" + using assms by (simp add: dual_order.antisym gap_monotone) + with `x \ ?k` have "x \ gap i x" by simp + then show ?thesis using tau_eq_state'[of x x] by simp + qed +qed + +lemma case_two_tau_almost_total: + assumes "\t. \T. gap i T \ gap i t" (is "\t. 
?P t") + shows "\ i (gap i (Least ?P)) \" + and "x \ gap i (Least ?P) \ \ i x \" +proof - + from assms have "?P (Least ?P)" + using LeastI_ex[of ?P] by simp + then show "\ i (gap i (Least ?P)) \" and "x \ gap i (Least ?P) \ \ i x \" + using case_two_tau_not_quite_total by simp_all +qed + +text \Some more properties of $\tau$.\ + +lemma init_tau_gap: "(\ i) \ (gap i t - 1) = e_take (gap i t) (block i t)" +proof (intro initI') + show 1: "e_length (e_take (gap i t) (block i t)) = Suc (gap i t - 1)" + proof - + have "gap i t > 0" + using gap_gr0 by simp + moreover have "gap i t < e_length (block i t)" + using gap_in_block by simp + ultimately have "e_length (e_take (gap i t) (block i t)) = gap i t" + by simp + then show ?thesis using gap_gr0 by simp + qed + show "\ i x \= e_nth (e_take (gap i t) (block i t)) x" if "x < Suc (gap i t - 1)" for x + proof - + have x_le: "x < gap i t" + using that gap_gr0 by simp + then have "x < e_length (block i t)" + using gap_in_block less_trans by blast + then have *: "\ i x \= e_nth (block i t) x" + using x_le tau_eq_state by auto + have "x < e_length (e_take (gap i t) (block i t))" + using x_le 1 by simp + then have "e_nth (block i t) x = e_nth (e_take (gap i t) (block i t)) x" + using x_le by simp + then show ?thesis using * by simp + qed +qed + +lemma change_on_0_init_tau: + assumes "change_on_0 (block i t) (gap i t)" + shows "(\ i) \ (t + 1) = block i t" +proof (intro initI') + let ?b = "block i t" and ?k = "gap i t" + show "e_length (block i t) = Suc (t + 1)" + using length_block by simp + show "(\ i) x \= e_nth (block i t) x" if "x < Suc (t + 1)" for x + proof (cases "x = ?k") + case True + have "gap i (Suc t) = e_length ?b" and b: "block i (Suc t) = e_snoc ?b 0" + using gap_Suc(1) block_Suc(1) assms by simp_all + then have "x < e_length (block i (Suc t))" "x \ gap i (Suc t)" + using that length_block by simp_all + then have "\ i x \= e_nth (block i (Suc t)) x" + using tau_eq_state by simp + then show ?thesis using that assms b by (simp add: nth_append) + next + case False + then show ?thesis using that assms tau_eq_state' by simp + qed +qed + +lemma change_on_0_hyp_change: + assumes "change_on_0 (block i t) (gap i t)" + shows "\ i ((\ i) \ (t + 1)) \ \ i ((\ i) \ (gap i t - 1))" + using assms hd_block init_tau_gap change_on_0_init_tau by simp + +lemma change_on_1_init_tau: + assumes "change_on_1 (block i t) (gap i t)" + shows "(\ i) \ (t + 1) = e_update (block i t) (gap i t) 1" +proof (intro initI') + let ?b = "block i t" and ?k = "gap i t" + show "e_length (e_update ?b ?k 1) = Suc (t + 1)" + using length_block by simp + show "(\ i) x \= e_nth (e_update ?b ?k 1) x" if "x < Suc (t + 1)" for x + proof (cases "x = ?k") + case True + have "gap i (Suc t) = e_length ?b" and b: "block i (Suc t) = e_snoc (e_update ?b ?k 1) 0" + using gap_Suc(2) block_Suc(2) assms by simp_all + then have "x < e_length (block i (Suc t))" "x \ gap i (Suc t)" + using that length_block by simp_all + then have "\ i x \= e_nth (block i (Suc t)) x" + using tau_eq_state by simp + then show ?thesis using that assms b nth_append by (simp add: nth_append) + next + case False + then show ?thesis using that assms tau_eq_state' by simp + qed +qed + +lemma change_on_1_hyp_change: + assumes "change_on_1 (block i t) (gap i t)" + shows "\ i ((\ i) \ (t + 1)) \ \ i ((\ i) \ (gap i t - 1))" + using assms hd_block init_tau_gap change_on_1_init_tau by simp + +lemma change_on_either_hyp_change: + assumes "\ change_on_neither (block i t) (gap i t)" + shows "\ i ((\ i) \ (t + 1)) \ \ i ((\ i) \ (gap i 
t - 1))" + using assms change_on_0_hyp_change change_on_1_hyp_change by auto + +lemma filled_gap_0_init_tau: + assumes "f\<^sub>0 = (\ i)((gap i t):=Some 0)" + shows "f\<^sub>0 \ (t + 1) = block i t" +proof (intro initI') + show len: "e_length (block i t) = Suc (t + 1)" + using assms length_block by auto + show "f\<^sub>0 x \= e_nth (block i t) x" if "x < Suc (t + 1)" for x + proof (cases "x = gap i t") + case True + then show ?thesis using assms last_block by auto + next + case False + then show ?thesis using assms len tau_eq_state that by auto + qed +qed + +lemma filled_gap_1_init_tau: + assumes "f\<^sub>1 = (\ i)((gap i t):=Some 1)" + shows "f\<^sub>1 \ (t + 1) = e_update (block i t) (gap i t) 1" +proof (intro initI') + show len: "e_length (e_update (block i t) (gap i t) 1) = Suc (t + 1)" + using e_length_update length_block by simp + show "f\<^sub>1 x \= e_nth (e_update (block i t) (gap i t) 1) x" if "x < Suc (t + 1)" for x + proof (cases "x = gap i t") + case True + moreover have "gap i t < e_length (block i t)" + using gap_in_block by simp + ultimately show ?thesis using assms by simp + next + case False + then show ?thesis using assms len tau_eq_state that by auto + qed +qed + + +subsection \The separating class\ + +text \Next we define the sets $V_i$ from the introductory proof sketch +(page~\pageref{s:lim_bc}).\ + +definition V_bclim :: "nat \ partial1 set" where + "V_bclim i \ + if case_two i + then let k = gap i (LEAST t. \T. gap i T \ gap i t) + in {(\ i)(k:=Some 0), (\ i)(k:=Some 1)} + else {\ i}" + +lemma V_subseteq_R1: "V_bclim i \ \" +proof (cases "case_two i") + case True + define k where "k = gap i (LEAST t. \T. gap i T \ gap i t)" + have "\ i \ \
" + using tau_in_P2 P2_proj_P1 by auto + then have "(\ i)(k:=Some 0) \ \
" and "(\ i)(k:=Some 1) \ \
" + using P1_update_P1 by simp_all + moreover have "total1 ((\ i)(k:=Some v))" for v + using case_two_tau_almost_total(2)[OF True] k_def total1_def by simp + ultimately have "(\ i)(k:=Some 0) \ \" and "(\ i)(k:=Some 1) \ \" + using P1_total_imp_R1 by simp_all + moreover have "V_bclim i = {(\ i)(k:=Some 0), (\ i)(k:=Some 1)}" + using True V_bclim_def k_def by (simp add: Let_def) + ultimately show ?thesis by simp +next + case False + have "V_bclim i = {\ i}" + unfolding V_bclim_def by (simp add: False) + moreover have "\ i \ \" + using total1I case_one_tau_total[OF False] tau_in_P2 P2_proj_P1[of \] P1_total_imp_R1 + by simp + ultimately show ?thesis by simp +qed + +lemma case_one_imp_gap_unbounded: + assumes "case_one i" + shows "\t. gap i t - 1 > n" +proof (induction n) + case 0 + then show ?case + using assms gap_gr0[of i] state_at_0(2)[of i] by (metis diff_is_0_eq gr_zeroI) +next + case (Suc n) + then obtain t where t: "gap i t - 1 > n" + by auto + moreover from assms have "\t. \T. gap i T > gap i t" + using leI by blast + ultimately obtain T where "gap i T > gap i t" + by auto + then have "gap i T - 1 > gap i t - 1" + using gap_gr0[of i] by (simp add: Suc_le_eq diff_less_mono) + with t have "gap i T - 1 > Suc n" by simp + then show ?case by auto +qed + +lemma case_one_imp_not_learn_lim_V: + assumes "case_one i" + shows "\ learn_lim \ (V_bclim i) (\ i)" +proof - + have V_bclim: "V_bclim i = {\ i}" + using assms V_bclim_def by (auto simp add: Let_def) + have "\m\<^sub>1>n. \m\<^sub>2>n. (\ i) ((\ i) \ m\<^sub>1) \ (\ i) ((\ i) \ m\<^sub>2)" for n + proof - + obtain t where t: "gap i t - 1 > n" + using case_one_imp_gap_unbounded[OF assms] by auto + moreover have "\t. \T\t. \ change_on_neither (block i T) (gap i T)" + using assms case_two_iff_forever_neither by blast + ultimately obtain T where T: "T \ t" "\ change_on_neither (block i T) (gap i T)" + by auto + then have "(\ i) ((\ i) \ (T + 1)) \ (\ i) ((\ i) \ (gap i T - 1))" + using change_on_either_hyp_change by simp + moreover have "gap i T - 1 > n" + using t T(1) gap_monotone by (simp add: diff_le_mono less_le_trans) + moreover have "T + 1 > n" + proof - + have "gap i T - 1 \ T" + using gap_in_block length_block by (simp add: le_diff_conv less_Suc_eq_le) + then show ?thesis using `gap i T - 1 > n` by simp + qed + ultimately show ?thesis by auto + qed + with infinite_hyp_changes_not_Lim V_bclim show ?thesis by simp +qed + +lemma case_two_imp_not_learn_lim_V: + assumes "case_two i" + shows "\ learn_lim \ (V_bclim i) (\ i)" +proof - + let ?P = "\t. \T. (gap i T) \ (gap i t)" + let ?t = "LEAST t. ?P t" + let ?k = "gap i ?t" + let ?b = "e_take ?k (block i ?t)" + have t: "\T. gap i T \ gap i ?t" + using assms LeastI_ex[of ?P] by simp + then have neither: "\T\?t. change_on_neither (block i T) (gap i T)" + using gap_le_Suc gap_monotone state_change_on_neither(1) + by (metis (no_types, lifting) antisym) + have gap_T: "\T\?t. gap i T = ?k" + using t gap_monotone antisym_conv by blast + define f\<^sub>0 where "f\<^sub>0 = (\ i)(?k:=Some 0)" + define f\<^sub>1 where "f\<^sub>1 = (\ i)(?k:=Some 1)" + show ?thesis + proof (rule same_hyp_for_two_not_Lim) + show "f\<^sub>0 \ V_bclim i" and "f\<^sub>1 \ V_bclim i" + using assms V_bclim_def f\<^sub>0_def f\<^sub>1_def by (simp_all add: Let_def) + show "f\<^sub>0 \ f\<^sub>1" using f\<^sub>0_def f\<^sub>1_def by (meson map_upd_eqD1 zero_neq_one) + show "\n\Suc ?t. 
\ i (f\<^sub>0 \ n) = \ i ?b" + proof - + have "\ i (block i T) = \ i (e_take ?k (block i T))" if "T \ ?t" for T + using that gap_T neither hd_block by metis + then have "\ i (block i T) = \ i ?b" if "T \ ?t" for T + by (metis (no_types, lifting) init_tau_gap gap_T that) + then have "\ i (f\<^sub>0 \ (T + 1)) = \ i ?b" if "T \ ?t" for T + using filled_gap_0_init_tau[of f\<^sub>0 i T] f\<^sub>0_def gap_T that + by (metis (no_types, lifting)) + then have "\ i (f\<^sub>0 \ T) = \ i ?b" if "T \ Suc ?t" for T + using that by (metis (no_types, lifting) Suc_eq_plus1 Suc_le_D Suc_le_mono) + then show ?thesis by simp + qed + show "\n\Suc ?t. \ i (f\<^sub>1 \ n) = \ i ?b" + proof - + have "\ i (e_update (block i T) ?k 1) = \ i (e_take ?k (block i T))" if "T \ ?t" for T + using neither by (metis (no_types, lifting) hd_block gap_T that) + then have "\ i (e_update (block i T) ?k 1) = \ i ?b" if "T \ ?t" for T + using that init_tau_gap[of i] gap_T by (metis (no_types, lifting)) + then have "\ i (f\<^sub>1 \ (T + 1)) = \ i ?b" if "T \ ?t" for T + using filled_gap_1_init_tau[of f\<^sub>1 i T] f\<^sub>1_def gap_T that + by (metis (no_types, lifting)) + then have "\ i (f\<^sub>1 \ T) = \ i ?b" if "T \ Suc ?t" for T + using that by (metis (no_types, lifting) Suc_eq_plus1 Suc_le_D Suc_le_mono) + then show ?thesis by simp + qed + qed +qed + +corollary not_learn_lim_V: "\ learn_lim \ (V_bclim i) (\ i)" + using case_one_imp_not_learn_lim_V case_two_imp_not_learn_lim_V + by (cases "case_two i") simp_all + +text \Next we define the separating class.\ + +definition V_BCLIM :: "partial1 set" ("V\<^bsub>BC-LIM\<^esub>") where + "V\<^bsub>BC-LIM\<^esub> \ \i. V_bclim i" + +lemma V_BCLIM_R1: "V\<^bsub>BC-LIM\<^esub> \ \" + using V_BCLIM_def V_subseteq_R1 by auto + +lemma V_BCLIM_not_in_Lim: "V\<^bsub>BC-LIM\<^esub> \ LIM" +proof + assume "V\<^bsub>BC-LIM\<^esub> \ LIM" + then obtain s where s: "learn_lim \ V\<^bsub>BC-LIM\<^esub> s" + using learn_lim_wrt_goedel[OF goedel_numbering_phi] Lim_def by blast + moreover obtain i where "\ i = s" + using s learn_limE(1) phi_universal by blast + ultimately have "learn_lim \ V\<^bsub>BC-LIM\<^esub> (\x. eval r_sigma [i, x])" + using learn_lim_sigma by simp + moreover have "V_bclim i \ V\<^bsub>BC-LIM\<^esub>" + using V_BCLIM_def by auto + ultimately have "learn_lim \ (V_bclim i) (\x. eval r_sigma [i, x])" + using learn_lim_closed_subseteq by simp + then show False + using not_learn_lim_V by simp +qed + + +subsection \The separating class is in BC\ + +text \In order to show @{term "V\<^bsub>BC-LIM\<^esub> \ BC"} we +define a hypothesis space that for every function $\tau_i$ and every list $b$ +of numbers contains a copy of $\tau_i$ with the first $|b|$ values replaced +by $b$.\ + +definition psitau :: partial2 ("\\<^sup>\") where + "\\<^sup>\ b x \ (if x < e_length b then Some (e_nth b x) else \ (e_hd b) x)" + +lemma psitau_in_P2: "\\<^sup>\ \ \
\<^sup>2" +proof - + define r where "r \ + Cn 2 + (r_lifz r_nth (Cn 2 r_tau [Cn 2 r_hd [Id 2 0], Id 2 1])) + [Cn 2 r_less [Id 2 1, Cn 2 r_length [Id 2 0]], Id 2 0, Id 2 1]" + then have "recfn 2 r" + using r_tau_recfn by simp + moreover have "eval r [b, x] = \\<^sup>\ b x" for b x + proof - + let ?f = "Cn 2 r_tau [Cn 2 r_hd [Id 2 0], Id 2 1]" + have "recfn 2 r_nth" "recfn 2 ?f" + using r_tau_recfn by simp_all + then have "eval (r_lifz r_nth ?f) [c, b, x] = + (if c = 0 then eval r_nth [b, x] else eval ?f [b, x])" for c + by simp + moreover have "eval r_nth [b, x] \= e_nth b x" + by simp + moreover have "eval ?f [b, x] = \ (e_hd b) x" + using r_tau_recfn by simp + ultimately have "eval (r_lifz r_nth ?f) [c, b, x] = + (if c = 0 then Some (e_nth b x) else \ (e_hd b) x)" for c + by simp + moreover have "eval (Cn 2 r_less [Id 2 1, Cn 2 r_length [Id 2 0]]) [b, x] \= + (if x < e_length b then 0 else 1)" + by simp + ultimately show ?thesis + unfolding r_def psitau_def using r_tau_recfn by simp + qed + ultimately show ?thesis by auto +qed + +lemma psitau_init: + "\\<^sup>\ (f \ n) x = (if x < Suc n then Some (the (f x)) else \ (the (f 0)) x)" +proof - + let ?e = "f \ n" + have "e_length ?e = Suc n" by simp + moreover have "x < Suc n \ e_nth ?e x = the (f x)" by simp + moreover have "e_hd ?e = the (f 0)" + using hd_init by simp + ultimately show ?thesis using psitau_def by simp +qed + +text \The class @{term V_BCLIM} can be learned BC-style in the +hypothesis space @{term psitau} by the identity function.\ + +lemma learn_bc_V_BCLIM: "learn_bc \\<^sup>\ V\<^bsub>BC-LIM\<^esub> Some" +proof (rule learn_bcI) + show "environment \\<^sup>\ V\<^bsub>BC-LIM\<^esub> Some" + using identity_in_R1 V_BCLIM_R1 psitau_in_P2 by auto + show "\n\<^sub>0. \n\n\<^sub>0. \\<^sup>\ (the (Some (f \ n))) = f" if "f \ V\<^bsub>BC-LIM\<^esub>" for f + proof - + from that V_BCLIM_def obtain i where i: "f \ V_bclim i" + by auto + show ?thesis + proof (cases "case_two i") + case True + let ?P = "\t. \T. (gap i T) \ (gap i t)" + let ?lmin = "LEAST t. 
?P t" + define k where "k \ gap i ?lmin" + have V_bclim: "V_bclim i = {(\ i)(k:=Some 0), (\ i)(k:=Some 1)}" + using True V_bclim_def k_def by (simp add: Let_def) + moreover have "0 < k" + using gap_gr0[of i] k_def by simp + ultimately have "f 0 \= i" + using tau_at_0[of i] i by auto + have "\\<^sup>\ (f \ n) = f" if "n \ k" for n + proof + fix x + show "\\<^sup>\ (f \ n) x = f x" + proof (cases "x \ n") + case True + then show ?thesis + using R1_imp_total1 V_subseteq_R1 i psitau_init by fastforce + next + case False + then have "\\<^sup>\ (f \ n) x = \ (the (f 0)) x" + using psitau_init by simp + then have "\\<^sup>\ (f \ n) x = \ i x" + using `f 0 \= i` by simp + moreover have "f x = \ i x" + using False V_bclim i that by auto + ultimately show ?thesis by simp + qed + qed + then show ?thesis by auto + next + case False + then have "V_bclim i = {\ i}" + using V_bclim_def by (auto simp add: Let_def) + then have f: "f = \ i" + using i by simp + have "\\<^sup>\ (f \ n) = f" for n + proof + fix x + show "\\<^sup>\ (f \ n) x = f x" + proof (cases "x \ n") + case True + then show ?thesis + using R1_imp_total1 V_BCLIM_R1 psitau_init that by auto + next + case False + then show ?thesis by (simp add: f psitau_init tau_at_0) + qed + qed + then show ?thesis by simp + qed + qed +qed + +text \Finally, the main result of this section:\ + +theorem Lim_subset_BC: "LIM \ BC" + using learn_bc_V_BCLIM BC_def Lim_subseteq_BC V_BCLIM_not_in_Lim by auto + +end diff --git a/thys/Inductive_Inference/Lemma_R.thy b/thys/Inductive_Inference/Lemma_R.thy new file mode 100644 --- /dev/null +++ b/thys/Inductive_Inference/Lemma_R.thy @@ -0,0 +1,2114 @@ +section \Lemma R\label{s:lemma_r}\ + +theory Lemma_R + imports Inductive_Inference_Basics +begin + +text \A common technique for constructing a class that cannot be +learned is diagonalization against all strategies (see, for instance, +Section~\ref{s:lim_bc}). Similarly, the typical way of proving that a class +cannot be learned is by assuming there is a strategy and deriving a +contradiction. Both techniques are easier to carry out if one has to consider +only \emph{total} recursive strategies. This is not possible in general, +since after all the definitions of the inference types admit strictly partial +strategies. However, for many inference types one can show that for every +strategy there is a total strategy with at least the same ``learning power''. +Results to that effect are called Lemma~R. + +Lemma~R comes in different strengths depending on how general the +construction of the total recursive strategy is. CONS is the only inference +type considered here for which not even a weak form of Lemma~R holds.\ + + +subsection \Strong Lemma R for LIM, FIN, and BC\ + +text \In its strong form Lemma~R says that for any strategy $S$, there +is a total strategy $T$ that learns all classes $S$ learns regardless of +hypothesis space. The strategy $T$ can be derived from $S$ by a delayed +simulation of $S$. More precisely, for input $f^n$, $T$ simulates $S$ for +prefixes $f^0, f^1, \ldots, f^n$ for at most $n$ steps. If $S$ halts on none +of the prefixes, $T$ outputs an arbitrary hypothesis. Otherwise let $k \leq +n$ be maximal such that $S$ halts on $f^k$ in at most $n$ steps. Then $T$ +outputs $S(f^k)$. \ + +text \We reformulate some lemmas for @{term r_result1} to make it easier +to use them with @{term "\"}.\ + +lemma r_result1_converg_phi: + assumes "\ i x \= v" + shows "\t. + (\t'\t. 
eval r_result1 [t', i, x] \= Suc v) \ + (\t'= 0)" + using assms r_result1_converg' phi_def by simp_all + +lemma r_result1_bivalent': + assumes "eval r_phi [i, x] \= v" + shows "eval r_result1 [t, i, x] \= Suc v \ eval r_result1 [t, i, x] \= 0" + using assms r_result1 r_result_bivalent' r_phi'' by simp + +lemma r_result1_bivalent_phi: + assumes "\ i x \= v" + shows "eval r_result1 [t, i, x] \= Suc v \ eval r_result1 [t, i, x] \= 0" + using assms r_result1_bivalent' phi_def by simp_all + +lemma r_result1_diverg_phi: + assumes "\ i x \" + shows "eval r_result1 [t, i, x] \= 0" + using assms phi_def r_result1_diverg' by simp + +lemma r_result1_some_phi: + assumes "eval r_result1 [t, i, x] \= Suc v" + shows "\ i x \= v" + using assms phi_def r_result1_Some' by simp + +lemma r_result1_saturating': + assumes "eval r_result1 [t, i, x] \= Suc v" + shows "eval r_result1 [t + d, i, x] \= Suc v" + using assms r_result1 r_result_saturating r_phi'' by simp + +lemma r_result1_saturating_the: + assumes "the (eval r_result1 [t, i, x]) > 0" and "t' \ t" + shows "the (eval r_result1 [t', i, x]) > 0" +proof - + from assms(1) obtain v where "eval r_result1 [t, i, x] \= Suc v" + using r_result1_bivalent_phi r_result1_diverg_phi + by (metis inc_induct le_0_eq not_less_zero option.discI option.expand option.sel) + with assms have "eval r_result1 [t', i, x] \= Suc v" + using r_result1_saturating' le_Suc_ex by blast + then show ?thesis by simp +qed + +lemma Greatest_bounded_Suc: + fixes P :: "nat \ nat" + shows "(if P n > 0 then Suc n + else if \j 0 then Suc (GREATEST j. j < n \ P j > 0) else 0) = + (if \j 0 then Suc (GREATEST j. j < Suc n \ P j > 0) else 0)" + (is "?lhs = ?rhs") +proof (cases "\j 0") + case 1: True + show ?thesis + proof (cases "P n > 0") + case True + then have "(GREATEST j. j < Suc n \ P j > 0) = n" + using Greatest_equality[of "\j. j < Suc n \ P j > 0"] by simp + moreover have "?rhs = Suc (GREATEST j. j < Suc n \ P j > 0)" + using 1 by simp + ultimately have "?rhs = Suc n" by simp + then show ?thesis using True by simp + next + case False + then have "?lhs = Suc (GREATEST j. j < n \ P j > 0)" + using 1 by (metis less_SucE) + moreover have "?rhs = Suc (GREATEST j. j < Suc n \ P j > 0)" + using 1 by simp + moreover have "(GREATEST j. j < n \ P j > 0) = + (GREATEST j. j < Suc n \ P j > 0)" + using 1 False by (metis less_SucI less_Suc_eq) + ultimately show ?thesis by simp + qed +next + case False + then show ?thesis by auto +qed + +text \For $n$, $i$, $x$, the next function simulates $\varphi_i$ on all +non-empty prefixes of at most length $n$ of the list $x$ for at most $n$ +steps. It returns the length of the longest such prefix for which $\varphi_i$ +halts, or zero if $\varphi_i$ does not halt for any prefix.\ + +definition "r_delay_aux \ + Pr 2 (r_constn 1 0) + (Cn 4 r_ifz + [Cn 4 r_result1 + [Cn 4 r_length [Id 4 3], Id 4 2, + Cn 4 r_take [Cn 4 S [Id 4 0], Id 4 3]], + Id 4 1, Cn 4 S [Id 4 0]])" + +lemma r_delay_aux_prim: "prim_recfn 3 r_delay_aux" + unfolding r_delay_aux_def by simp_all + +lemma r_delay_aux_total: "total r_delay_aux" + using prim_recfn_total[OF r_delay_aux_prim] . + +lemma r_delay_aux: + assumes "n \ e_length x" + shows "eval r_delay_aux [n, i, x] \= + (if \j 0 + then Suc (GREATEST j. 
+ j < n \ + the (eval r_result1 [e_length x, i, e_take (Suc j) x]) > 0) + else 0)" +proof - + define z where "z \ + Cn 4 r_result1 + [Cn 4 r_length [Id 4 3], Id 4 2, Cn 4 r_take [Cn 4 S [Id 4 0], Id 4 3]]" + then have z_recfn: "recfn 4 z" by simp + have z: "eval z [j, r, i, x] = eval r_result1 [e_length x, i, e_take (Suc j) x]" + if "j < e_length x" for j r i x + unfolding z_def using that by simp + + define g where "g \ Cn 4 r_ifz [z, Id 4 1, Cn 4 S [Id 4 0]]" + then have g: "eval g [j, r, i, x] \= + (if the (eval r_result1 [e_length x, i, e_take (Suc j) x]) > 0 then Suc j else r)" + if "j < e_length x" for j r i x + using that z prim_recfn_total z_recfn by simp + + show ?thesis + using assms + proof (induction n) + case 0 + moreover have "eval r_delay_aux [0, i, x] \= 0" + using eval_Pr_0 r_delay_aux_def r_delay_aux_prim r_constn + by (simp add: r_delay_aux_def) + ultimately show ?case by simp + next + case (Suc n) + let ?P = "\j. the (eval r_result1 [e_length x, i, e_take (Suc j) x])" + have "eval r_delay_aux [n, i, x] \" + using Suc by simp + moreover have "eval r_delay_aux [Suc n, i, x] = + eval (Pr 2 (r_constn 1 0) g) [Suc n, i, x]" + unfolding r_delay_aux_def g_def z_def by simp + ultimately have "eval r_delay_aux [Suc n, i, x] = + eval g [n, the (eval r_delay_aux [n, i, x]), i, x]" + using r_delay_aux_prim Suc eval_Pr_converg_Suc + by (simp add: r_delay_aux_def g_def z_def numeral_3_eq_3) + then have "eval r_delay_aux [Suc n, i, x] \= + (if ?P n > 0 then Suc n + else if \j 0 then Suc (GREATEST j. j < n \ ?P j > 0) else 0)" + using g Suc by simp + then have "eval r_delay_aux [Suc n, i, x] \= + (if \j 0 then Suc (GREATEST j. j < Suc n \ ?P j > 0) else 0)" + using Greatest_bounded_Suc[where ?P="?P"] by simp + then show ?case by simp + qed +qed + +text \The next function simulates $\varphi_i$ on all non-empty prefixes +of a list $x$ of length $n$ for at most $n$ steps and outputs the length of +the longest prefix for which $\varphi_i$ halts, or zero if $\varphi_i$ does +not halt for any such prefix.\ + +definition "r_delay \ Cn 2 r_delay_aux [Cn 2 r_length [Id 2 1], Id 2 0, Id 2 1]" + +lemma r_delay_recfn [simp]: "recfn 2 r_delay" + unfolding r_delay_def by (simp add: r_delay_aux_prim) + +lemma r_delay: + "eval r_delay [i, x] \= + (if \j 0 + then Suc (GREATEST j. + j < e_length x \ the (eval r_result1 [e_length x, i, e_take (Suc j) x]) > 0) + else 0)" + unfolding r_delay_def using r_delay_aux r_delay_aux_prim by simp + +definition "delay i x \ Some + (if \j 0 + then Suc (GREATEST j. + j < e_length x \ the (eval r_result1 [e_length x, i, e_take (Suc j) x]) > 0) + else 0)" + +lemma delay_in_R2: "delay \ \\<^sup>2" + using r_delay totalI2 R2I delay_def r_delay_recfn + by (metis (no_types, lifting) numeral_2_eq_2 option.simps(3)) + +lemma delay_le_length: "the (delay i x) \ e_length x" +proof (cases "\j 0") + case True + let ?P = "\j. j < e_length x \ the (eval r_result1 [e_length x, i, e_take (Suc j) x]) > 0" + from True have "\j. ?P j" by simp + moreover have "\y. 
?P y \ y \ e_length x" by simp + ultimately have "?P (Greatest ?P)" + using GreatestI_ex_nat[where ?P="?P"] by blast + then have "Greatest ?P < e_length x" by simp + moreover have "delay i x \= Suc (Greatest ?P)" + using delay_def True by simp + ultimately show ?thesis by auto +next + case False + then show ?thesis using delay_def by auto +qed + +lemma e_take_delay_init: + assumes "f \ \" and "the (delay i (f \ n)) > 0" + shows "e_take (the (delay i (f \ n))) (f \ n) = f \ (the (delay i (f \ n)) - 1)" + using assms e_take_init[of f _ n] length_init[of f n] delay_le_length[of i "f \ n"] + by (metis One_nat_def Suc_le_lessD Suc_pred) + +lemma delay_gr0_converg: + assumes "the (delay i x) > 0" + shows "\ i (e_take (the (delay i x)) x) \" +proof - + let ?P = "\j. j < e_length x \ the (eval r_result1 [e_length x, i, e_take (Suc j) x]) > 0" + have "\j. ?P j" + proof (rule ccontr) + assume "\ (\j. ?P j)" + then have "delay i x \= 0" + using delay_def by simp + with assms show False by simp + qed + then have d: "the (delay i x) = Suc (Greatest ?P)" + using delay_def by simp + moreover have "\y. ?P y \ y \ e_length x" by simp + ultimately have "?P (Greatest ?P)" + using `\j. ?P j` GreatestI_ex_nat[where ?P="?P"] by blast + then have "the (eval r_result1 [e_length x, i, e_take (Suc (Greatest ?P)) x]) > 0" + by simp + then have "the (eval r_result1 [e_length x, i, e_take (the (delay i x)) x]) > 0" + using d by simp + then show ?thesis using r_result1_diverg_phi by fastforce +qed + +lemma delay_unbounded: + fixes n :: nat + assumes "f \ \" and "\n. \ i (f \ n) \" + shows "\m. the (delay i (f \ m)) > n" +proof - + from assms have "\t. the (eval r_result1 [t, i, f \ n]) > 0" + using r_result1_converg_phi + by (metis le_refl option.exhaust_sel option.sel zero_less_Suc) + then obtain t where t: "the (eval r_result1 [t, i, f \ n]) > 0" + by auto + let ?m = "max n t" + have "Suc ?m \ t" by simp + have m: "the (eval r_result1 [Suc ?m, i, f \ n]) > 0" + proof - + let ?w = "eval r_result1 [t, i, f \ n]" + obtain v where v: "?w \= Suc v" + using t assms(2) r_result1_bivalent_phi by fastforce + have "eval r_result1 [Suc ?m, i, f \ n] = ?w" + using v t r_result1_saturating' `Suc ?m \ t` le_Suc_ex by fastforce + then show ?thesis using t by simp + qed + let ?x = "f \ ?m" + have "the (delay i ?x) > n" + proof - + let ?P = "\j. j < e_length ?x \ the (eval r_result1 [e_length ?x, i, e_take (Suc j) ?x]) > 0" + have "e_length ?x = Suc ?m" by simp + moreover have "e_take (Suc n) ?x = f \ n" + using assms(1) e_take_init by auto + ultimately have "?P n" + using m by simp + have "\y. ?P y \ y \ e_length ?x" by simp + with `?P n` have "n \ (Greatest ?P)" + using Greatest_le_nat[of ?P n "e_length ?x"] by simp + moreover have "the (delay i ?x) = Suc (Greatest ?P)" + using delay_def `?P n` by auto + ultimately show ?thesis by simp + qed + then show ?thesis by auto +qed + +lemma delay_monotone: + assumes "f \ \" and "n\<^sub>1 \ n\<^sub>2" + shows "the (delay i (f \ n\<^sub>1)) \ the (delay i (f \ n\<^sub>2))" + (is "the (delay i ?x1) \ the (delay i ?x2)") +proof (cases "the (delay i (f \ n\<^sub>1)) = 0") + case True + then show ?thesis by simp +next + case False + let ?P1 = "\j. j < e_length ?x1 \ the (eval r_result1 [e_length ?x1, i, e_take (Suc j) ?x1]) > 0" + let ?P2 = "\j. j < e_length ?x2 \ the (eval r_result1 [e_length ?x2, i, e_take (Suc j) ?x2]) > 0" + from False have d1: "the (delay i ?x1) = Suc (Greatest ?P1)" "\j. ?P1 j" + using delay_def option.collapse by fastforce+ + moreover have "\y. 
?P1 y \ y \ e_length ?x1" by simp + ultimately have *: "?P1 (Greatest ?P1)" using GreatestI_ex_nat[of ?P1] by blast + let ?j = "Greatest ?P1" + from * have "?j < e_length ?x1" by auto + then have 1: "e_take (Suc ?j) ?x1 = e_take (Suc ?j) ?x2" + using assms e_take_init by auto + from * have 2: "?j < e_length ?x2" using assms(2) by auto + with 1 * have "the (eval r_result1 [e_length ?x1, i, e_take (Suc ?j) ?x2]) > 0" + by simp + moreover have "e_length ?x1 \ e_length ?x2" + using assms(2) by auto + ultimately have "the (eval r_result1 [e_length ?x2, i, e_take (Suc ?j) ?x2]) > 0" + using r_result1_saturating_the by simp + with 2 have "?P2 ?j" by simp + then have d2: "the (delay i ?x2) = Suc (Greatest ?P2)" + using delay_def by auto + have "\y. ?P2 y \ y \ e_length ?x2" by simp + with `?P2 ?j` have "?j \ (Greatest ?P2)" using Greatest_le_nat[of ?P2] by blast + with d1 d2 show ?thesis by simp +qed + +lemma delay_unbounded_monotone: + fixes n :: nat + assumes "f \ \" and "\n. \ i (f \ n) \" + shows "\m\<^sub>0. \m\m\<^sub>0. the (delay i (f \ m)) > n" +proof - + from assms delay_unbounded obtain m\<^sub>0 where "the (delay i (f \ m\<^sub>0)) > n" + by blast + then have "\m\m\<^sub>0. the (delay i (f \ m)) > n" + using assms(1) delay_monotone order.strict_trans2 by blast + then show ?thesis by auto +qed + +text \Now we can define a function that simulates an arbitrary strategy +$\varphi_i$ in a delayed way. The parameter $d$ is the default hypothesis for +when $\varphi_i$ does not halt within the time bound for any prefix.\ + +definition r_totalizer :: "nat \ recf" where + "r_totalizer d \ + Cn 2 + (r_lifz + (r_constn 1 d) + (Cn 2 r_phi + [Id 2 0, Cn 2 r_take [Cn 2 r_delay [Id 2 0, Id 2 1], Id 2 1]])) + [Cn 2 r_delay [Id 2 0, Id 2 1], Id 2 0, Id 2 1]" + +lemma r_totalizer_recfn: "recfn 2 (r_totalizer d)" + unfolding r_totalizer_def by simp + +lemma r_totalizer: + "eval (r_totalizer d) [i, x] = + (if the (delay i x) = 0 then Some d else \ i (e_take (the (delay i x)) x))" +proof - + let ?i = "Cn 2 r_delay [Id 2 0, Id 2 1]" + have "eval ?i [i, x] = eval r_delay [i, x]" for i x + using r_delay_recfn by simp + then have i: "eval ?i [i, x] = delay i x" for i x + using r_delay by (simp add: delay_def) + let ?t = "r_constn 1 d" + have t: "eval ?t [i, x] \= d" for i x by simp + let ?e1 = "Cn 2 r_take [?i, Id 2 1]" + let ?e = "Cn 2 r_phi [Id 2 0, ?e1]" + have "eval ?e1 [i, x] = eval r_take [the (delay i x), x]" for i x + using r_delay i delay_def by simp + then have "eval ?e1 [i, x] \= e_take (the (delay i x)) x" for i x + using delay_le_length by simp + then have e: "eval ?e [i, x] = \ i (e_take (the (delay i x)) x)" + using phi_def by simp + let ?z = "r_lifz ?t ?e" + have recfn_te: "recfn 2 ?t" "recfn 2 ?e" + by simp_all + then have "eval (r_totalizer d) [i, x] = eval (r_lifz ?t ?e) [the (delay i x), i, x]" + for i x + unfolding r_totalizer_def using i r_totalizer_recfn delay_def by simp + then have "eval (r_totalizer d) [i, x] = + (if the (delay i x) = 0 then eval ?t [i, x] else eval ?e [i, x])" + for i x + using recfn_te by simp + then show ?thesis using t e by simp +qed + +lemma r_totalizer_total: "total (r_totalizer d)" +proof (rule totalI2) + show "recfn 2 (r_totalizer d)" using r_totalizer_recfn by simp + show "\x y. 
eval (r_totalizer d) [x, y] \" + using r_totalizer delay_gr0_converg by simp +qed + +definition totalizer :: "nat \ partial2" where + "totalizer d i x \ + if the (delay i x) = 0 then Some d else \ i (e_take (the (delay i x)) x)" + +lemma totalizer_init: + assumes "f \ \" + shows "totalizer d i (f \ n) = + (if the (delay i (f \ n)) = 0 then Some d + else \ i (f \ (the (delay i (f \ n)) - 1)))" + using assms e_take_delay_init by (simp add: totalizer_def) + +lemma totalizer_in_R2: "totalizer d \ \\<^sup>2" + using totalizer_def r_totalizer r_totalizer_total R2I r_totalizer_recfn + by metis + +text \For LIM, @{term totalizer} works with every default hypothesis +$d$.\ + +lemma lemma_R_for_Lim: + assumes "learn_lim \ U (\ i)" + shows "learn_lim \ U (totalizer d i)" +proof (rule learn_limI) + show env: "environment \ U (totalizer d i)" + using assms learn_limE(1) totalizer_in_R2 by auto + show "\j. \ j = f \ (\\<^sup>\n. totalizer d i (f \ n) \= j)" if "f \ U" for f + proof - + have "f \ \" + using assms env that by auto + from assms learn_limE obtain j n\<^sub>0 where + j: "\ j = f" and + n0: "\n\n\<^sub>0. (\ i) (f \ n) \= j" + using `f \ U` by metis + obtain m\<^sub>0 where m0: "\m\m\<^sub>0. the (delay i (f \ m)) > n\<^sub>0" + using delay_unbounded_monotone `f \ \` \f \ U\ assms learn_limE(1) + by blast + then have "\m\m\<^sub>0. totalizer d i (f \ m) = \ i (e_take (the (delay i (f \ m))) (f \ m))" + using totalizer_def by auto + then have "\m\m\<^sub>0. totalizer d i (f \ m) = \ i (f \ (the (delay i (f \ m)) - 1))" + using e_take_delay_init m0 `f \ \` by auto + with m0 n0 have "\m\m\<^sub>0. totalizer d i (f \ m) \= j" + by auto + with j show ?thesis by auto + qed +qed + +text \The effective version of Lemma~R for LIM states that there is a +total recursive function computing Gödel numbers of total strategies +from those of arbitrary strategies.\ + +lemma lemma_R_for_Lim_effective: + "\g\\. \i. + \ (the (g i)) \ \ \ + (\U \. learn_lim \ U (\ i) \ learn_lim \ U (\ (the (g i))))" +proof - + have "totalizer 0 \ \
\<^sup>2" using totalizer_in_R2 by auto + then obtain g where g: "g \ \" "\i. (totalizer 0) i = \ (the (g i))" + using numbering_translation_for_phi by blast + with totalizer_in_R2 have "\i. \ (the (g i)) \ \" + by (metis R2_proj_R1) + moreover from g(2) lemma_R_for_Lim[where ?d=0] have + "\i U \. learn_lim \ U (\ i) \ learn_lim \ U (\ (the (g i)))" + by simp + ultimately show ?thesis using g(1) by blast +qed + +text \In order for us to use the previous lemma, we need a function +that performs the actual computation:\ + +definition "r_limr \ + SOME g. + recfn 1 g \ + total g \ + (\i. \ (the (eval g [i])) \ \ \ + (\U \. learn_lim \ U (\ i) \ learn_lim \ U (\ (the (eval g [i])))))" + +lemma r_limr_recfn: "recfn 1 r_limr" + and r_limr_total: "total r_limr" + and r_limr: + "\ (the (eval r_limr [i])) \ \" + "learn_lim \ U (\ i) \ learn_lim \ U (\ (the (eval r_limr [i])))" +proof - + let ?P = "\g. + g \ \ \ + (\i. \ (the (g i)) \ \ \ (\U \. learn_lim \ U (\ i) \ learn_lim \ U (\ (the (g i)))))" + let ?Q = "\g. + recfn 1 g \ + total g \ + (\i. \ (the (eval g [i])) \ \ \ + (\U \. learn_lim \ U (\ i) \ learn_lim \ U (\ (the (eval g [i])))))" + have "\g. ?P g" using lemma_R_for_Lim_effective by auto + then obtain g where "?P g" by auto + then obtain g' where g': "recfn 1 g'" "total g'" "\i. eval g' [i] = g i" + by blast + with `?P g` have "?Q g'" by simp + with r_limr_def someI_ex[of ?Q] show + "recfn 1 r_limr" + "total r_limr" + "\ (the (eval r_limr [i])) \ \" + "learn_lim \ U (\ i) \ learn_lim \ U (\ (the (eval r_limr [i])))" + by auto +qed + +text \For BC, too, @{term totalizer} works with every default +hypothesis $d$.\ + +lemma lemma_R_for_BC: + assumes "learn_bc \ U (\ i)" + shows "learn_bc \ U (totalizer d i)" +proof (rule learn_bcI) + show env: "environment \ U (totalizer d i)" + using assms learn_bcE(1) totalizer_in_R2 by auto + show "\n\<^sub>0. \n\n\<^sub>0. \ (the (totalizer d i (f \ n))) = f" if "f \ U" for f + proof - + have "f \ \" + using assms env that by auto + obtain n\<^sub>0 where n0: "\n\n\<^sub>0. \ (the ((\ i) (f \ n))) = f" + using assms learn_bcE `f \ U` by metis + obtain m\<^sub>0 where m0: "\m\m\<^sub>0. the (delay i (f \ m)) > n\<^sub>0" + using delay_unbounded_monotone `f \ \` \f \ U\ assms learn_bcE(1) + by blast + then have "\m\m\<^sub>0. totalizer d i (f \ m) = \ i (e_take (the (delay i (f \ m))) (f \ m))" + using totalizer_def by auto + then have "\m\m\<^sub>0. totalizer d i (f \ m) = \ i (f \ (the (delay i (f \ m)) - 1))" + using e_take_delay_init m0 `f \ \` by auto + with m0 n0 have "\m\m\<^sub>0. \ (the (totalizer d i (f \ m))) = f" + by auto + then show ?thesis by auto + qed +qed + +corollary lemma_R_for_BC_simple: + assumes "learn_bc \ U s" + shows "\s'\\. learn_bc \ U s'" + using assms lemma_R_for_BC totalizer_in_R2 learn_bcE + by (metis R2_proj_R1 learn_bcE(1) phi_universal) + + +text \For FIN the default hypothesis of @{term totalizer} must be +zero, signalling ``don't know yet''.\ + +lemma lemma_R_for_FIN: + assumes "learn_fin \ U (\ i)" + shows "learn_fin \ U (totalizer 0 i)" +proof (rule learn_finI) + show env: "environment \ U (totalizer 0 i)" + using assms learn_finE(1) totalizer_in_R2 by auto + show "\j n\<^sub>0. \ j = f \ + (\n0. totalizer 0 i (f \ n) \= 0) \ + (\n\n\<^sub>0. totalizer 0 i (f \ n) \= Suc j)" + if "f \ U" for f + proof - + have "f \ \" + using assms env that by auto + from assms learn_finE[of \ U "\ i"] obtain j where + j: "\ j = f" and + ex_n0: "\n\<^sub>0. (\n0. (\ i) (f \ n) \= 0) \ (\n\n\<^sub>0. 
(\ i) (f \ n) \= Suc j)" + using `f \ U` by blast + let ?Q = "\n\<^sub>0. (\n0. (\ i) (f \ n) \= 0) \ (\n\n\<^sub>0. (\ i) (f \ n) \= Suc j)" + define n\<^sub>0 where "n\<^sub>0 = Least ?Q" + with ex_n0 have n0: "?Q n\<^sub>0" "\n0. \ ?Q n" + using LeastI_ex[of ?Q] not_less_Least[of _ ?Q] by blast+ + define m\<^sub>0 where "m\<^sub>0 = (LEAST m\<^sub>0. \m\m\<^sub>0. the (delay i (f \ m)) > n\<^sub>0)" + (is "m\<^sub>0 = Least ?P") + moreover have "\m\<^sub>0. \m\m\<^sub>0. the (delay i (f \ m)) > n\<^sub>0" + using delay_unbounded_monotone `f\\` \f \ U\ assms learn_finE(1) + by simp + ultimately have m0: "?P m\<^sub>0" "\m0. \ ?P m" + using LeastI_ex[of ?P] not_less_Least[of _ ?P] by blast+ + then have "\m\m\<^sub>0. totalizer 0 i (f \ m) = \ i (e_take (the (delay i (f \ m))) (f \ m))" + using totalizer_def by auto + then have "\m\m\<^sub>0. totalizer 0 i (f \ m) = \ i (f \ (the (delay i (f \ m)) - 1))" + using e_take_delay_init m0 `f\\` by auto + with m0 n0 have "\m\m\<^sub>0. totalizer 0 i (f \ m) \= Suc j" + by auto + moreover have "totalizer 0 i (f \ m) \= 0" if "m < m\<^sub>0" for m + proof (cases "the (delay i (f \ m)) = 0") + case True + then show ?thesis by (simp add: totalizer_def) + next + case False + then have "the (delay i (f \ m)) \ n\<^sub>0" + using m0 that `f \ \` delay_monotone by (meson leI order.strict_trans2) + then show ?thesis + using \f \ \\ n0(1) totalizer_init by (simp add: Suc_le_lessD) + qed + ultimately show ?thesis using j by auto + qed +qed + + +subsection \Weaker Lemma R for CP and TOTAL\ + +text \For TOTAL the default hypothesis used by @{term totalizer} +depends on the hypothesis space, because it must refer to a total function in +that space. Consequently the total strategy depends on the hypothesis space, +which makes this form of Lemma~R weaker than the ones in the previous +section.\ + +lemma lemma_R_for_TOTAL: + fixes \ :: partial2 + shows "\d. \U. \i. learn_total \ U (\ i) \ learn_total \ U (totalizer d i)" +proof (cases "\d. \ d \ \") + case True + then obtain d where "\ d \ \" by auto + have "learn_total \ U (totalizer d i)" if "learn_total \ U (\ i)" for U i + proof (rule learn_totalI) + show env: "environment \ U (totalizer d i)" + using that learn_totalE(1) totalizer_in_R2 by auto + show "\f. f \ U \ \j. \ j = f \ (\\<^sup>\n. totalizer d i (f \ n) \= j)" + using that learn_total_def lemma_R_for_Lim[where ?d=d] learn_limE(2) by metis + show "\ (the (totalizer d i (f \ n))) \ \" if "f \ U" for f n + proof (cases "the (delay i (f \ n)) = 0") + case True + then show ?thesis using totalizer_def `\ d \ \` by simp + next + case False + have "f \ \" + using that env by auto + then show ?thesis + using False that `learn_total \ U (\ i)` totalizer_init learn_totalE(3) + by simp + qed + qed + then show ?thesis by auto +next + case False + then show ?thesis using learn_total_def lemma_R_for_Lim by auto +qed + +corollary lemma_R_for_TOTAL_simple: + assumes "learn_total \ U s" + shows "\s'\\. learn_total \ U s'" + using assms lemma_R_for_TOTAL totalizer_in_R2 + by (metis R2_proj_R1 learn_totalE(1) phi_universal) + +text \For CP the default hypothesis used by @{term totalizer} depends +on both the hypothesis space and the class. Therefore the total strategy +depends on both the the hypothesis space and the class, which makes Lemma~R +for CP even weaker than the one for TOTAL.\ + +lemma lemma_R_for_CP: + fixes \ :: partial2 and U :: "partial1 set" + assumes "learn_cp \ U (\ i)" + shows "\d. 
learn_cp \ U (totalizer d i)" +proof (cases "U = {}") + case True + then show ?thesis using assms learn_cp_def lemma_R_for_Lim by auto +next + case False + then obtain f where "f \ U" by auto + from `f \ U` obtain d where "\ d = f" + using learn_cpE(2)[OF assms] by auto + with `f \ U` have "\ d \ U" by simp + have "learn_cp \ U (totalizer d i)" + proof (rule learn_cpI) + show env: "environment \ U (totalizer d i)" + using assms learn_cpE(1) totalizer_in_R2 by auto + show "\f. f \ U \ \j. \ j = f \ (\\<^sup>\n. totalizer d i (f \ n) \= j)" + using assms learn_cp_def lemma_R_for_Lim[where ?d=d] learn_limE(2) by metis + show "\ (the (totalizer d i (f \ n))) \ U" if "f \ U" for f n + proof (cases "the (delay i (f \ n)) = 0") + case True + then show ?thesis using totalizer_def `\ d \ U` by simp + next + case False + then show ?thesis + using that env assms totalizer_init learn_cpE(3) by auto + qed + qed + then show ?thesis by auto +qed + + +subsection \No Lemma R for CONS\ + +text \This section demonstrates that the class $V_{01}$ of all total +recursive functions $f$ where $f(0)$ or $f(1)$ is a Gödel number of $f$ can +be consistently learned in the limit, but not by a total strategy. This implies +that Lemma~R does not hold for CONS.\ + +definition V01 :: "partial1 set" ("V\<^sub>0\<^sub>1") where + "V\<^sub>0\<^sub>1 = {f. f \ \ \ (\ (the (f 0)) = f \ \ (the (f 1)) = f)}" + + +subsubsection \No total CONS strategy for @{term "V\<^sub>0\<^sub>1"}\label{s:v01_not_total}\ + +text \In order to show that no total strategy can learn @{term +"V\<^sub>0\<^sub>1"} we construct, for each total strategy $S$, one or two +functions in @{term "V\<^sub>0\<^sub>1"} such that $S$ fails for at least one +of them. At the core of this construction is a process that given a total +recursive strategy $S$ and numbers $z, i, j \in \mathbb{N}$ builds a function +$f$ as follows: Set $f(0) = i$ and $f(1) = j$. For $x\geq1$: +\begin{enumerate} +\item[(a)] Check whether $S$ changes its hypothesis when $f^x$ is + extended by 0, that is, if $S(f^x) \neq S(f^x0)$. If so, set $f(x+1) = 0$. +\item[(b)] Otherwise check if $S$ changes its hypothesis when $f^x$ is extended + by $1$, that is, if $S(f^x) \neq S(f^x1)$. If so, set $f(x+1) = 1$. +\item[(c)] If neither happens, set $f(x+1) = z$. +\end{enumerate} +In other words, as long as we can force $S$ to change its hypothesis by +extending the function by 0 or 1, we do just that. Now there are two +cases: +\begin{enumerate} +\item[Case 1.] For all $x\geq1$ either (a) or (b) occurs; then $S$ + changes its hypothesis on $f$ all the time and thus does not learn $f$ in + the limit (not to mention consistently). The value of $z$ makes no + difference in this case. +\item[Case 2.] For some minimal $x$, (c) occurs, that is, + there is an $f^x$ such that $h := S(f^x) = S(f^x0) = S(f^x1)$. But the + hypothesis $h$ cannot be consistent with both prefixes $f^x0$ and $f^x1$. + Running the process once with $z = 0$ and once with $z = 1$ yields two + functions starting with $f^x0$ and $f^x1$, respectively, such that $S$ + outputs the same hypothesis, $h$, on both prefixes and thus cannot be + consistent for both functions. +\end{enumerate} +This process is computable because $S$ is total. The construction does not +work if we only assume $S$ to be a CONS strategy for $V_{01}$, because we +need to be able to apply $S$ to prefixes not in $V_{01}$. + +The parameters $i$ and $j$ provide flexibility to find functions built by the +above process that are actually in $V_{01}$. 
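+In formulas (merely restating steps (a)--(c) above), for fixed $S$, $z$, $i$
+and $j$ the process builds the function $f$ with $f(0) = i$, $f(1) = j$ and,
+for $x \geq 1$,
+\[
+f(x+1) =
+\begin{cases}
+0 & \text{if } S(f^x0) \neq S(f^x),\\
+1 & \text{if } S(f^x0) = S(f^x) \text{ and } S(f^x1) \neq S(f^x),\\
+z & \text{otherwise,}
+\end{cases}
+\]
+where $f^x$, $f^x0$, $f^x1$ denote prefixes as in the sketch. It remains to
+pick $i$ and $j$ such that the resulting functions are members of $V_{01}$.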
To this end we will use +Smullyan's double fixed-point theorem.\ + +context + fixes s :: partial1 + assumes s_in_R1 [simp, intro]: "s \ \" +begin + +text \The function @{term prefixes} constructs prefixes according to the +aforementioned process.\ + +fun prefixes :: "nat \ nat \ nat \ nat \ nat list" where + "prefixes z i j 0 = [i]" +| "prefixes z i j (Suc x) = prefixes z i j x @ + [if x = 0 then j + else if s (list_encode (prefixes z i j x @ [0])) \ s (list_encode (prefixes z i j x)) + then 0 + else if s (list_encode (prefixes z i j x @ [1])) \ s (list_encode (prefixes z i j x)) + then 1 + else z]" + +lemma prefixes_length: "length (prefixes z i j x) = Suc x" + by (induction x) simp_all + +text \The functions @{term[names_short] "adverse z i j"} are the +functions constructed by @{term[names_short] "prefixes"}.\ + +definition adverse :: "nat \ nat \ nat \ nat \ nat option" where + "adverse z i j x \ Some (last (prefixes z i j x))" + +lemma init_adverse_eq_prefixes: "(adverse z i j) \ n = list_encode (prefixes z i j n)" +proof - + have "prefix (adverse z i j) n = prefixes z i j n" + proof (induction n) + case 0 + then show ?case using adverse_def prefixes_length prefixI' by fastforce + next + case (Suc n) + then show ?case using adverse_def by (simp add: prefix_Suc) + qed + then show ?thesis by (simp add: init_def) +qed + +lemma adverse_at_01: + "adverse z i j 0 \= i" + "adverse z i j 1 \= j" + by (auto simp add: adverse_def) + +text \Had we introduced ternary partial recursive functions, the +@{term[names_short] "adverse z"} functions would be among them.\ + +lemma adverse_in_R3: "\r. recfn 3 r \ total r \ (\i j x. eval r [i, j, x]) = adverse z" +proof - + obtain rs where rs: "recfn 1 rs" "total rs" "(\x. eval rs [x]) = s" + using R1E by auto + have s_total: "\x. s x \" by simp + + define f where "f = Cn 2 r_singleton_encode [Id 2 0]" + then have "recfn 2 f" by simp + have f: "\i j. eval f [i, j] \= list_encode [i]" + unfolding f_def by simp + + define ch1 where "ch1 = Cn 4 r_ifeq + [Cn 4 rs [Cn 4 r_snoc [Id 4 1, r_constn 3 1]], + Cn 4 rs [Id 4 1], + r_dummy 3 (r_const z), + r_constn 3 1]" + then have ch1: "recfn 4 ch1" "total ch1" + using Cn_total prim_recfn_total rs by auto + + define ch0 where "ch0 = Cn 4 r_ifeq + [Cn 4 rs [Cn 4 r_snoc [Id 4 1, r_constn 3 0]], + Cn 4 rs [Id 4 1], + ch1, + r_constn 3 0]" + then have ch0_total: "total ch0" "recfn 4 ch0" + using Cn_total prim_recfn_total rs ch1 by auto + + have "eval ch1 [l, v, i, j] \= (if s (e_snoc v 1) = s v then z else 1)" for l v i j + proof - + have "eval ch1 [l, v, i, j] = eval r_ifeq [the (s (e_snoc v 1)), the (s v), z, 1]" + unfolding ch1_def using rs by auto + then show ?thesis by (simp add: s_total option.expand) + qed + moreover have "eval ch0 [l, v, i, j] \= + (if s (e_snoc v 0) = s v then the (eval ch1 [l, v, i, j]) else 0)" for l v i j + proof - + have "eval ch0 [l, v, i, j] = + eval r_ifeq [the (s (e_snoc v 0)), the (s v), the (eval ch1 [l, v, i, j]), 0]" + unfolding ch0_def using rs ch1 by auto + then show ?thesis by (simp add: s_total option.expand) + qed + ultimately have ch0: "\l v i j. eval ch0 [l, v, i, j] \= + (if s (e_snoc v 0) \ s v then 0 + else if s (e_snoc v 1) \ s v then 1 else z)" + by simp + + define app where "app = Cn 4 r_ifz [Id 4 0, Id 4 3, ch0]" + then have "recfn 4 app" "total app" + using ch0_total totalI4 by auto + have "eval app [l, v, i, j] \= (if l = 0 then j else the (eval ch0 [l, v, i, j]))" for l v i j + unfolding app_def using ch0_total by simp + with ch0 have app: "\l v i j. 
eval app [l, v, i, j] \= + (if l = 0 then j + else if s (e_snoc v 0) \ s v then 0 + else if s (e_snoc v 1) \ s v then 1 else z)" + by simp + + define g where "g = Cn 4 r_snoc [Id 4 1, app]" + with app have g: "\l v i j. eval g [l, v, i, j] \= e_snoc v + (if l = 0 then j + else if s (e_snoc v 0) \ s v then 0 + else if s (e_snoc v 1) \ s v then 1 else z)" + using `recfn 4 app` by auto + from g_def have "recfn 4 g" "total g" + using `recfn 4 app` `total app` Cn_total Mn_free_imp_total by auto + + define b where "b = Pr 2 f g" + then have "recfn 3 b" + using `recfn 2 f` `recfn 4 g` by simp + have b: "eval b [x, i, j] \= list_encode (prefixes z i j x)" for x i j + proof (induction x) + case 0 + then show ?case + unfolding b_def using f `recfn 2 f` \recfn 4 g\ by simp + next + case (Suc x) + then have "eval b [Suc x, i, j] = eval g [x, the (eval b [x, i, j]), i, j]" + using b_def `recfn 3 b` by simp + also have "... \= + (let v = list_encode (prefixes z i j x) + in e_snoc v + (if x = 0 then j + else if s (e_snoc v 0) \ s v then 0 + else if s (e_snoc v 1) \ s v then 1 else z))" + using g Suc by simp + also have "... \= + (let v = list_encode (prefixes z i j x) + in e_snoc v + (if x = 0 then j + else if s (list_encode (prefixes z i j x @ [0])) \ s v then 0 + else if s (list_encode (prefixes z i j x @ [1])) \ s v then 1 else z))" + using list_decode_encode by presburger + finally show ?case by simp + qed + + define b' where "b' = Cn 3 b [Id 3 2, Id 3 0, Id 3 1]" + then have "recfn 3 b'" + using `recfn 3 b` by simp + with b have b': "\i j x. eval b' [i, j, x] \= list_encode (prefixes z i j x)" + using b'_def by simp + + define r where "r = Cn 3 r_last [b']" + then have "recfn 3 r" + using `recfn 3 b'` by simp + with b' have "\i j x. eval r [i, j, x] \= last (prefixes z i j x)" + using r_def prefixes_length by auto + moreover from this have "total r" + using totalI3 `recfn 3 r` by simp + ultimately have "(\i j x. eval r [i, j, x]) = adverse z" + unfolding adverse_def by simp + with `recfn 3 r` `total r` show ?thesis by auto +qed + +lemma adverse_in_R1: "adverse z i j \ \" +proof - + from adverse_in_R3 obtain r where + r: "recfn 3 r" "total r" "(\i j x. eval r [i, j, x]) = adverse z" + by blast + define rij where "rij = Cn 1 r [r_const i, r_const j, Id 1 0]" + then have "recfn 1 rij" "total rij" + using r(1,2) Cn_total Mn_free_imp_total by auto + from rij_def have "\x. eval rij [x] = eval r [i, j, x]" + using r(1) by auto + with r(3) have "\x. eval rij [x] = adverse z i j x" + by metis + with `recfn 1 rij` `total rij` show ?thesis by auto +qed + +text \Next we show that for every $z$ there are $i$, $j$ such that +@{term[names_short] "adverse z i j \ V\<^sub>0\<^sub>1"}. The first step is to show that for every +$z$, Gödel numbers for @{term[names_short] "adverse z i j"} can be computed +uniformly from $i$ and $j$.\ + +lemma phi_translate_adverse: "\f\\\<^sup>2.\i j. \ (the (f i j)) = adverse z i j" +proof - + obtain r where r: "recfn 3 r" "total r" "(\i j x. eval r [i, j, x]) = adverse z" + using adverse_in_R3 by blast + let ?p = "encode r" + define rf where "rf = Cn 2 (r_smn 1 2) [r_dummy 1 (r_const ?p), Id 2 0, Id 2 1]" + then have "recfn 2 rf" and "total rf" + using Mn_free_imp_total by simp_all + define f where "f \ \i j. 
eval rf [i, j]" + with `recfn 2 rf` `total rf` have "f \ \\<^sup>2" by auto + have rf: "eval rf [i, j] = eval (r_smn 1 2) [?p, i, j]" for i j + unfolding rf_def by simp + { + fix i j x + have "\ (the (f i j)) x = eval r_phi [the (f i j), x]" + using phi_def by simp + also have "... = eval r_phi [the (eval rf [i, j]), x]" + using f_def by simp + also have "... = eval (r_universal 1) [the (eval (r_smn 1 2) [?p, i, j]), x]" + using rf r_phi_def by simp + also have "... = eval (r_universal (2 + 1)) (?p # [i, j] @ [x])" + using smn_lemma[of 1 "[i, j]" 2 "[x]"] by simp + also have "... = eval (r_universal 3) [?p, i, j, x]" + by simp + also have "... = eval r [i, j, x]" + using r_universal r by simp + also have "... = adverse z i j x" + using r(3) by metis + finally have "\ (the (f i j)) x = adverse z i j x" . + } + with `f \ \\<^sup>2` show ?thesis by blast +qed + +text \The second, and final, step is to apply Smullyan's double +fixed-point theorem to show the existence of @{term[names_short] adverse} +functions in @{term "V\<^sub>0\<^sub>1"}.\ + +lemma adverse_in_V01: "\m n. adverse 0 m n \ V\<^sub>0\<^sub>1 \ adverse 1 m n \ V\<^sub>0\<^sub>1" +proof - + obtain f\<^sub>0 where f0: "f\<^sub>0 \ \\<^sup>2" "\i j. \ (the (f\<^sub>0 i j)) = adverse 0 i j" + using phi_translate_adverse[of 0] by auto + obtain f\<^sub>1 where f1: "f\<^sub>1 \ \\<^sup>2" "\i j. \ (the (f\<^sub>1 i j)) = adverse 1 i j" + using phi_translate_adverse[of 1] by auto + obtain m n where "\ m = \ (the (f\<^sub>0 m n))" and "\ n = \ (the (f\<^sub>1 m n))" + using smullyan_double_fixed_point[OF f0(1) f1(1)] by blast + with f0(2) f1(2) have "\ m = adverse 0 m n" and "\ n = adverse 1 m n" + by simp_all + moreover have "the (adverse 0 m n 0) = m" and "the (adverse 1 m n 1) = n" + using adverse_at_01 by simp_all + ultimately have + "\ (the (adverse 0 m n 0)) = adverse 0 m n" + "\ (the (adverse 1 m n 1)) = adverse 1 m n" + by simp_all + moreover have "adverse 0 m n \ \" and "adverse 1 m n \ \" + using adverse_in_R1 by simp_all + ultimately show ?thesis using V01_def by auto +qed + +text \Before we prove the main result of this section we need some +lemmas regarding the shape of the @{term[names_short] adverse} functions and +hypothesis changes of the strategy.\ + +lemma adverse_Suc: + assumes "x > 0" + shows "adverse z i j (Suc x) \= + (if s (e_snoc ((adverse z i j) \ x) 0) \ s ((adverse z i j) \ x) + then 0 + else if s (e_snoc ((adverse z i j) \ x) 1) \ s ((adverse z i j) \ x) + then 1 else z)" +proof - + have "adverse z i j (Suc x) \= + (if s (list_encode (prefixes z i j x @ [0])) \ s (list_encode (prefixes z i j x)) + then 0 + else if s (list_encode (prefixes z i j x @ [1])) \ s (list_encode (prefixes z i j x)) + then 1 else z)" + using assms adverse_def by simp + then show ?thesis by (simp add: init_adverse_eq_prefixes) +qed + +text \The process in the proof sketch (page~\pageref{s:v01_not_total}) +consists of steps (a), (b), and (c). The next abbreviation is true iff.\ step +(a) or (b) applies.\ + +abbreviation "hyp_change z i j x \ + s (e_snoc ((adverse z i j) \ x) 0) \ s ((adverse z i j) \ x) \ + s (e_snoc ((adverse z i j) \ x) 1) \ s ((adverse z i j) \ x)" + +text \If step (c) applies, the process appends $z$.\ + +lemma adverse_Suc_not_hyp_change: + assumes "x > 0" and "\ hyp_change z i j x" + shows "adverse z i j (Suc x) \= z" + using assms adverse_Suc by simp + +text \While (a) or (b) applies, the process appends a value that +forces $S$ to change its hypothesis.\ + +lemma while_hyp_change: + assumes "\x\n. 
x > 0 \ hyp_change z i j x" + shows "\x\Suc n. adverse z i j x = adverse z' i j x" + using assms +proof (induction n) + case 0 + then show ?case by (simp add: adverse_def le_Suc_eq) +next + case (Suc n) + then have "\x\n. x > 0 \ hyp_change z i j x" by simp + with Suc have "\x\Suc n. x > 0 \ adverse z i j x = adverse z' i j x" + by simp + moreover have "adverse z i j 0 = adverse z' i j 0" + using adverse_at_01 by simp + ultimately have zz': "\x\Suc n. adverse z i j x = adverse z' i j x" + by auto + moreover have "adverse z i j \ \" "adverse z' i j \ \" + using adverse_in_R1 by simp_all + ultimately have init_zz': "(adverse z i j) \ (Suc n) = (adverse z' i j) \ (Suc n)" + using init_eqI by blast + + have "adverse z i j (Suc (Suc n)) = adverse z' i j (Suc (Suc n))" + proof (cases "s (e_snoc ((adverse z i j) \ (Suc n)) 0) \ s ((adverse z i j) \ (Suc n))") + case True + then have "s (e_snoc ((adverse z' i j) \ (Suc n)) 0) \ s ((adverse z' i j) \ (Suc n))" + using init_zz' by simp + then have "adverse z' i j (Suc (Suc n)) \= 0" + by (simp add: adverse_Suc) + moreover have "adverse z i j (Suc (Suc n)) \= 0" + using True by (simp add: adverse_Suc) + ultimately show ?thesis by simp + next + case False + then have "s (e_snoc ((adverse z' i j) \ (Suc n)) 0) = s ((adverse z' i j) \ (Suc n))" + using init_zz' by simp + then have "adverse z' i j (Suc (Suc n)) \= 1" + using init_zz' Suc.prems adverse_Suc by (smt le_refl zero_less_Suc) + moreover have "adverse z i j (Suc (Suc n)) \= 1" + using False Suc.prems adverse_Suc by auto + ultimately show ?thesis by simp + qed + with zz' show ?case using le_SucE by blast +qed + +text \The next result corresponds to Case~1 from the proof sketch.\ + +lemma always_hyp_change_no_lim: + assumes "\x>0. hyp_change z i j x" + shows "\ learn_lim \ {adverse z i j} s" +proof (rule infinite_hyp_changes_not_Lim[of "adverse z i j"]) + show "adverse z i j \ {adverse z i j}" by simp + show "\n. \m\<^sub>1>n. \m\<^sub>2>n. s (adverse z i j \ m\<^sub>1) \ s (adverse z i j \ m\<^sub>2)" + proof + fix n + from assms obtain m\<^sub>1 where m1: "m\<^sub>1 > n" "hyp_change z i j m\<^sub>1" + by auto + have "s (adverse z i j \ m\<^sub>1) \ s (adverse z i j \ (Suc m\<^sub>1))" + proof (cases "s (e_snoc ((adverse z i j) \ m\<^sub>1) 0) \ s ((adverse z i j) \ m\<^sub>1)") + case True + then have "adverse z i j (Suc m\<^sub>1) \= 0" + using m1 adverse_Suc by simp + then have "(adverse z i j) \ (Suc m\<^sub>1) = e_snoc ((adverse z i j) \ m\<^sub>1) 0" + by (simp add: init_Suc_snoc) + with True show ?thesis by simp + next + case False + then have "adverse z i j (Suc m\<^sub>1) \= 1" + using m1 adverse_Suc by simp + then have "(adverse z i j) \ (Suc m\<^sub>1) = e_snoc ((adverse z i j) \ m\<^sub>1) 1" + by (simp add: init_Suc_snoc) + with False m1(2) show ?thesis by simp + qed + then show "\m\<^sub>1>n. \m\<^sub>2>n. s (adverse z i j \ m\<^sub>1) \ s (adverse z i j \ m\<^sub>2)" + using less_SucI m1(1) by blast + qed +qed + +text \The next result corresponds to Case~2 from the proof sketch.\ + +lemma no_hyp_change_no_cons: + assumes "x > 0" and "\ hyp_change z i j x" + shows "\ learn_cons \ {adverse 0 i j, adverse 1 i j} s" +proof - + let ?P = "\x. x > 0 \ \ hyp_change z i j x" + define xmin where "xmin = Least ?P" + with assms have xmin: + "?P xmin" + "\x. x < xmin \ \ ?P x" + using LeastI[of ?P] not_less_Least[of _ ?P] by simp_all + then have "xmin > 0" by simp + + have "\x\xmin - 1. 
x > 0 \ hyp_change z i j x" + using xmin by (metis One_nat_def Suc_pred le_imp_less_Suc) + then have + "\x\xmin. adverse z i j x = adverse 0 i j x" + "\x\xmin. adverse z i j x = adverse 1 i j x" + using while_hyp_change[of "xmin - 1" z i j 0] + using while_hyp_change[of "xmin - 1" z i j 1] + by simp_all + then have + init_z0: "(adverse z i j) \ xmin = (adverse 0 i j) \ xmin" and + init_z1: "(adverse z i j) \ xmin = (adverse 1 i j) \ xmin" + using adverse_in_R1 init_eqI by blast+ + then have + a0: "adverse 0 i j (Suc xmin) \= 0" and + a1: "adverse 1 i j (Suc xmin) \= 1" + using adverse_Suc_not_hyp_change xmin(1) init_z1 + by metis+ + then have + i0: "(adverse 0 i j) \ (Suc xmin) = e_snoc ((adverse z i j) \ xmin) 0" and + i1: "(adverse 1 i j) \ (Suc xmin) = e_snoc ((adverse z i j) \ xmin) 1" + using init_z0 init_z1 by (simp_all add: init_Suc_snoc) + moreover have + "s (e_snoc ((adverse z i j) \ xmin) 0) = s ((adverse z i j) \ xmin)" + "s (e_snoc ((adverse z i j) \ xmin) 1) = s ((adverse z i j) \ xmin)" + using xmin by simp_all + ultimately have + "s ((adverse 0 i j) \ (Suc xmin)) = s ((adverse z i j) \ xmin)" + "s ((adverse 1 i j) \ (Suc xmin)) = s ((adverse z i j) \ xmin)" + by simp_all + then have + "s ((adverse 0 i j) \ (Suc xmin)) = s ((adverse 1 i j) \ (Suc xmin))" + by simp + moreover have "(adverse 0 i j) \ (Suc xmin) \ (adverse 1 i j) \ (Suc xmin)" + using a0 a1 i0 i1 by (metis append1_eq_conv list_decode_encode zero_neq_one) + ultimately show "\ learn_cons \ {adverse 0 i j, adverse 1 i j} s" + using same_hyp_different_init_not_cons by blast +qed + +text \Combining the previous two lemmas shows that @{term +"V\<^sub>0\<^sub>1"} cannot be learned consistently in the limit by the total +strategy $S$.\ + +lemma V01_not_in_R_cons: "\ learn_cons \ V\<^sub>0\<^sub>1 s" +proof - + obtain m n where + mn0: "adverse 0 m n \ V\<^sub>0\<^sub>1" and + mn1: "adverse 1 m n \ V\<^sub>0\<^sub>1" + using adverse_in_V01 by auto + show "\ learn_cons \ V\<^sub>0\<^sub>1 s" + proof (cases "\x>0. hyp_change 0 m n x") + case True + then have "\ learn_lim \ {adverse 0 m n} s" + using always_hyp_change_no_lim by simp + with mn0 show ?thesis + using learn_cons_def learn_lim_closed_subseteq by auto + next + case False + then obtain x where x: "x > 0" "\ hyp_change 0 m n x" by auto + then have "\ learn_cons \ {adverse 0 m n, adverse 1 m n} s" + using no_hyp_change_no_cons[OF x] by simp + with mn0 mn1 show ?thesis using learn_cons_closed_subseteq by auto + qed +qed + +end + + +subsubsection \@{term "V\<^sub>0\<^sub>1"} is in CONS\ + +text \At first glance, consistently learning @{term "V\<^sub>0\<^sub>1"} looks fairly +easy. After all every @{term "f \ V\<^sub>0\<^sub>1"} provides a Gödel number of itself +either at argument 0 or 1. A strategy only has to figure out which one is +right. However, the strategy $S$ we are going to devise does not always +converge to $f(0)$ or $f(1)$. Instead it uses a technique called +``amalgamation''. The amalgamation of two Gödel numbers $i$ and $j$ is a +function whose value at $x$ is determined by simulating $\varphi_i(x)$ and +$\varphi_j(x)$ in parallel and outputting the value of the first one to halt. +If neither halts the value is undefined. There is a function +$a\in\mathcal{R}^2$ such that $\varphi_{a(i,j)}$ is the amalgamation of $i$ +and $j$. + +If @{term "f \ V\<^sub>0\<^sub>1"} then $\varphi_{a(f(0), f(1))}$ is +total because by definition of @{term "V\<^sub>0\<^sub>1"} we have +$\varphi_{f(0)} = f$ or $\varphi_{f(1)} = f$ and $f$ is total. 
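+
+As an informal summary (the formal definitions of parallel simulation and
+amalgamation given below are the authoritative ones; no new notation is
+introduced here beyond the function $a$ already mentioned), the amalgamation
+of $i$ and $j$ can be pictured as
+\[
+\varphi_{a(i,j)}(x) = \left\{\begin{array}{ll}
+  \varphi_i(x) & \mbox{if the simulation of $\varphi_i(x)$ halts first,}\\
+  \varphi_j(x) & \mbox{if the simulation of $\varphi_j(x)$ halts first,}\\
+  \mbox{undefined} & \mbox{if neither simulation halts,}
+\end{array}\right.
+\]
+where in case both simulations halt, one of the two values is returned.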
+ +Given a prefix $f^n$ of an @{term "f \ V\<^sub>0\<^sub>1"} the strategy +$S$ first computes $\varphi_{a(f(0), f(1))}(x)$ for $x = 0, \ldots, n$. For +the resulting prefix $\varphi^n_{a(f(0), f(1))}$ there are two cases: +\begin{enumerate} +\item[Case 1.] It differs from $f^n$, say at minimum index $x$. Then for + either $z = 0$ or $z = 1$ we have $\varphi_{f(z)}(x) \neq f(x)$ by + definition of amalgamation. This + implies $\varphi_{f(z)} \neq f$, and thus $\varphi_{f(1-z)} = f$ by + definition of @{term "V\<^sub>0\<^sub>1"}. We set $S(f^n) = f(1 - z)$. This + hypothesis is correct and hence consistent. +\item[Case 2.] It equals $f^n$. Then we set $S(f^n) = a(f(0), f(1))$. This + hypothesis is consistent by definition of this case. +\end{enumerate} + +In both cases the hypothesis is consistent. If Case~1 holds for some $n$, the +same $x$ and $z$ will be found also for all larger values of $n$. Therefore +$S$ converges to the correct hypothesis $f(1 - z)$. If Case~2 holds for all +$n$, then $S$ always outputs the same hypothesis $a(f(0), f(1))$ and thus +also converges. + +The above discussion tacitly assumes $n \geq 1$, such that both $f(0)$ and +$f(1)$ are available to $S$. For $n = 0$ the strategy outputs an arbitrary +consistent hypothesis.\ + +text \Amalgamation uses the concurrent simulation of functions.\ + +definition parallel :: "nat \ nat \ nat \ nat option" where + "parallel i j x \ eval r_parallel [i, j, x]" + +lemma r_parallel': "eval r_parallel [i, j, x] = parallel i j x" + using parallel_def by simp + +lemma r_parallel'': + shows "eval r_phi [i, x] \ \ eval r_phi [j, x] \ \ eval r_parallel [i, j, x] \" + and "eval r_phi [i, x] \ \ eval r_phi [j, x] \ \ + eval r_parallel [i, j, x] \= prod_encode (0, the (eval r_phi [i, x]))" + and "eval r_phi [j, x] \ \ eval r_phi [i, x] \ \ + eval r_parallel [i, j, x] \= prod_encode (1, the (eval r_phi [j, x]))" + and "eval r_phi [i, x] \ \ eval r_phi [j, x] \ \ + eval r_parallel [i, j, x] \= prod_encode (0, the (eval r_phi [i, x])) \ + eval r_parallel [i, j, x] \= prod_encode (1, the (eval r_phi [j, x]))" +proof - + let ?f = "Cn 1 r_phi [r_const i, Id 1 0]" + let ?g = "Cn 1 r_phi [r_const j, Id 1 0]" + have *: "\x. eval r_phi [i, x] = eval ?f [x]" "\x. 
eval r_phi [j, x] = eval ?g [x]" + by simp_all + show "eval r_phi [i, x] \ \ eval r_phi [j, x] \ \ eval r_parallel [i, j, x] \" + and "eval r_phi [i, x] \ \ eval r_phi [j, x] \ \ + eval r_parallel [i, j, x] \= prod_encode (0, the (eval r_phi [i, x]))" + and "eval r_phi [j, x] \ \ eval r_phi [i, x] \ \ + eval r_parallel [i, j, x] \= prod_encode (1, the (eval r_phi [j, x]))" + and "eval r_phi [i, x] \ \ eval r_phi [j, x] \ \ + eval r_parallel [i, j, x] \= prod_encode (0, the (eval r_phi [i, x])) \ + eval r_parallel [i, j, x] \= prod_encode (1, the (eval r_phi [j, x]))" + using r_parallel[OF *] by simp_all +qed + +lemma parallel: + "\ i x \ \ \ j x \ \ parallel i j x \" + "\ i x \ \ \ j x \ \ parallel i j x \= prod_encode (0, the (\ i x))" + "\ j x \ \ \ i x \ \ parallel i j x \= prod_encode (1, the (\ j x))" + "\ i x \ \ \ j x \ \ + parallel i j x \= prod_encode (0, the (\ i x)) \ + parallel i j x \= prod_encode (1, the (\ j x))" + using phi_def r_parallel'' r_parallel parallel_def by simp_all + +lemma parallel_converg_pdec1_0_or_1: + assumes "parallel i j x \" + shows "pdec1 (the (parallel i j x)) = 0 \ pdec1 (the (parallel i j x)) = 1" + using assms parallel[of i x j] parallel(3)[of j x i] + by (metis fst_eqD option.sel prod_encode_inverse) + +lemma parallel_converg_either: "(\ i x \ \ \ j x \) = (parallel i j x \)" + using parallel by (metis option.simps(3)) + +lemma parallel_0: + assumes "parallel i j x \= prod_encode (0, v)" + shows "\ i x \= v" + using parallel assms + by (smt option.collapse option.sel option.simps(3) prod.inject prod_encode_eq zero_neq_one) + +lemma parallel_1: + assumes "parallel i j x \= prod_encode (1, v)" + shows "\ j x \= v" + using parallel assms + by (smt option.collapse option.sel option.simps(3) prod.inject prod_encode_eq zero_neq_one) + +lemma parallel_converg_V01: + assumes "f \ V\<^sub>0\<^sub>1" + shows "parallel (the (f 0)) (the (f 1)) x \" +proof - + have "f \ \ \ (\ (the (f 0)) = f \ \ (the (f 1)) = f)" + using assms V01_def by auto + then have "\ (the (f 0)) \ \ \ \ (the (f 1)) \ \" + by auto + then have "\ (the (f 0)) x \ \ \ (the (f 1)) x \" + using R1_imp_total1 by auto + then show ?thesis using parallel_converg_either by simp +qed + +text \The amalgamation of two Gödel numbers can then be described +in terms of @{term "parallel"}.\ + +definition amalgamation :: "nat \ nat \ partial1" where + "amalgamation i j x \ + if parallel i j x \ then None else Some (pdec2 (the (parallel i j x)))" + +lemma amalgamation_diverg: "amalgamation i j x \ \ \ i x \ \ \ j x \" + using amalgamation_def parallel by (metis option.simps(3)) + +lemma amalgamation_total: + assumes "total1 (\ i) \ total1 (\ j)" + shows "total1 (amalgamation i j)" + using assms amalgamation_diverg[of i j] total_def by auto + +lemma amalgamation_V01_total: + assumes "f \ V\<^sub>0\<^sub>1" + shows "total1 (amalgamation (the (f 0)) (the (f 1)))" + using assms V01_def amalgamation_total R1_imp_total1 total1_def + by (metis (mono_tags, lifting) mem_Collect_eq) + +definition "r_amalgamation \ Cn 3 r_pdec2 [r_parallel]" + +lemma r_amalgamation_recfn: "recfn 3 r_amalgamation" + unfolding r_amalgamation_def by simp + +lemma r_amalgamation: "eval r_amalgamation [i, j, x] = amalgamation i j x" +proof (cases "parallel i j x \") + case True + then have "eval r_parallel [i, j, x] \" + by (simp add: r_parallel') + then have "eval r_amalgamation [i, j, x] \" + unfolding r_amalgamation_def by simp + moreover from True have "amalgamation i j x \" + using amalgamation_def by simp + ultimately show ?thesis by 
simp +next + case False + then have "eval r_parallel [i, j, x] \" + by (simp add: r_parallel') + then have "eval r_amalgamation [i, j, x] = eval r_pdec2 [the (eval r_parallel [i, j, x])]" + unfolding r_amalgamation_def by simp + also have "... \= pdec2 (the (eval r_parallel [i, j, x]))" + by simp + finally show ?thesis by (simp add: False amalgamation_def r_parallel') +qed + +text \The function @{term "amalgamate"} computes Gödel numbers of +amalgamations. It corresponds to the function $a$ from the proof sketch.\ + +definition amalgamate :: "nat \ nat \ nat" where + "amalgamate i j \ smn 1 (encode r_amalgamation) [i, j]" + +lemma amalgamate: "\ (amalgamate i j) = amalgamation i j" +proof + fix x + have "\ (amalgamate i j) x = eval r_phi [amalgamate i j, x]" + by (simp add: phi_def) + also have "... = eval r_phi [smn 1 (encode r_amalgamation) [i, j], x]" + using amalgamate_def by simp + also have "... = eval r_phi + [encode (Cn 1 (r_universal 3) + (r_constn 0 (encode r_amalgamation) # map (r_constn 0) [i, j] @ map (Id 1) [0])), x]" + using smn[of 1 "encode r_amalgamation" "[i, j]"] by (simp add: numeral_3_eq_3) + also have "... = eval r_phi + [encode (Cn 1 (r_universal 3) + (r_const (encode r_amalgamation) # [r_const i, r_const j, Id 1 0])), x]" + (is "... = eval r_phi [encode ?f, x]") + by (simp add: r_constn_def) + finally have "\ (amalgamate i j) x = eval r_phi + [encode (Cn 1 (r_universal 3) + (r_const (encode r_amalgamation) # [r_const i, r_const j, Id 1 0])), x]" . + then have "\ (amalgamate i j) x = eval (r_universal 3) [encode r_amalgamation, i, j, x]" + unfolding r_phi_def using r_universal[of ?f 1] r_amalgamation_recfn by simp + then show "\ (amalgamate i j) x = amalgamation i j x" + using r_amalgamation by (simp add: r_amalgamation_recfn r_universal) +qed + +lemma amalgamation_in_P1: "amalgamation i j \ \
" + using amalgamate by (metis P2_proj_P1 phi_in_P2) + +lemma amalgamation_V01_R1: + assumes "f \ V\<^sub>0\<^sub>1" + shows "amalgamation (the (f 0)) (the (f 1)) \ \" + using assms amalgamation_V01_total amalgamation_in_P1 + by (simp add: P1_total_imp_R1) + +definition "r_amalgamate \ + Cn 2 (r_smn 1 2) [r_dummy 1 (r_const (encode r_amalgamation)), Id 2 0, Id 2 1]" + +lemma r_amalgamate_recfn: "recfn 2 r_amalgamate" + unfolding r_amalgamate_def by simp + +lemma r_amalgamate: "eval r_amalgamate [i, j] \= amalgamate i j" +proof - + let ?p = "encode r_amalgamation" + have rs21: "eval (r_smn 1 2) [?p, i, j] \= smn 1 ?p [i, j]" + using r_smn by simp + moreover have "eval r_amalgamate [i, j] = eval (r_smn 1 2) [?p, i, j]" + unfolding r_amalgamate_def by auto + ultimately have "eval r_amalgamate [i, j] \= smn 1 ?p [i, j]" + by simp + then show ?thesis using amalgamate_def by simp +qed + +text \The strategy $S$ distinguishes the two cases from the proof +sketch with the help of the next function, which checks if a hypothesis +$\varphi_i$ is inconsistent with a prefix $e$. If so, it returns the least $x +< |e|$ witnessing the inconsistency; otherwise it returns the length $|e|$. +If $\varphi_i$ diverges for some $x < |e|$, so does the function.\ + +definition inconsist :: partial2 where + "inconsist i e \ + (if \x i x \ then None + else if \x i x \\ e_nth e x + then Some (LEAST x. x < e_length e \ \ i x \\ e_nth e x) + else Some (e_length e))" + +lemma inconsist_converg: + assumes "inconsist i e \" + shows "inconsist i e = + (if \x i x \\ e_nth e x + then Some (LEAST x. x < e_length e \ \ i x \\ e_nth e x) + else Some (e_length e))" + and "\x i x \" + using inconsist_def assms by (presburger, meson) + +lemma inconsist_bounded: + assumes "inconsist i e \" + shows "the (inconsist i e) \ e_length e" +proof (cases "\x i x \\ e_nth e x") + case True + then show ?thesis + using inconsist_converg[OF assms] + by (smt Least_le dual_order.strict_implies_order dual_order.strict_trans2 option.sel) +next + case False + then show ?thesis using inconsist_converg[OF assms] by auto +qed + +lemma inconsist_consistent: + assumes "inconsist i e \" + shows "inconsist i e \= e_length e \ (\x i x \= e_nth e x)" +proof + show "\x i x \= e_nth e x" if "inconsist i e \= e_length e" + proof (cases "\x i x \\ e_nth e x") + case True + then show ?thesis + using that inconsist_converg[OF assms] + by (metis (mono_tags, lifting) not_less_Least option.inject) + next + case False + then show ?thesis + using that inconsist_converg[OF assms] by simp + qed + show "\x i x \= e_nth e x \ inconsist i e \= e_length e" + unfolding inconsist_def using assms by auto +qed + +lemma inconsist_converg_eq: + assumes "inconsist i e \= e_length e" + shows "\x i x \= e_nth e x" + using assms inconsist_consistent by auto + +lemma inconsist_converg_less: + assumes "inconsist i e \" and "the (inconsist i e) < e_length e" + shows "\x i x \\ e_nth e x" + and "inconsist i e \= (LEAST x. x < e_length e \ \ i x \\ e_nth e x)" +proof - + show "\x i x \\ e_nth e x" + using assms by (metis (no_types, lifting) inconsist_converg(1) nat_neq_iff option.sel) + then show "inconsist i e \= (LEAST x. x < e_length e \ \ i x \\ e_nth e x)" + using assms inconsist_converg by presburger +qed + +lemma least_bounded_Suc: + assumes "\x. x < upper \ P x" + shows "(LEAST x. x < upper \ P x) = (LEAST x. x < Suc upper \ P x)" +proof - + let ?Q = "\x. 
x < upper \ P x" + let ?x = "Least ?Q" + from assms have "?x < upper \ P ?x" + using LeastI_ex[of ?Q] by simp + then have 1: "?x < Suc upper \ P ?x" by simp + from assms have 2: "\y P y" + using Least_le[of ?Q] not_less_Least by fastforce + have "(LEAST x. x < Suc upper \ P x) = ?x" + proof (rule Least_equality) + show "?x < Suc upper \ P ?x" using 1 2 by blast + show "\y. y < Suc upper \ P y \ ?x \ y" + using 1 2 leI by blast + qed + then show ?thesis .. +qed + +lemma least_bounded_gr: + fixes P :: "nat \ bool" and m :: nat + assumes "\x. x < upper \ P x" + shows "(LEAST x. x < upper \ P x) = (LEAST x. x < upper + m \ P x)" +proof (induction m) + case 0 + then show ?case by simp +next + case (Suc m) + moreover have "\x. x < upper + m \ P x" + using assms trans_less_add1 by blast + ultimately show ?case using least_bounded_Suc by simp +qed + +lemma inconsist_init_converg_less: + assumes "f \ \" + and "\ i \ \" + and "inconsist i (f \ n) \" + and "the (inconsist i (f \ n)) < Suc n" + shows "inconsist i (f \ (n + m)) = inconsist i (f \ n)" +proof - + have phi_i_total: "\ i x \" for x + using assms by simp + moreover have f_nth: "f x \= e_nth (f \ n) x" if "x < Suc n" for x n + using that assms(1) by simp + ultimately have "(\ i x \ f x) = (\ i x \\ e_nth (f \ n) x)" if "x < Suc n" for x n + using that by simp + then have cond: "(x < Suc n \ \ i x \ f x) = + (x < e_length (f \ n) \ \ i x \\ e_nth (f \ n) x)" for x n + using length_init by metis + then have + 1: "\x i x \ f x" and + 2: "inconsist i (f \ n) \= (LEAST x. x < Suc n \ \ i x \ f x)" + using assms(3,4) inconsist_converg_less[of i "f \ n"] by simp_all + then have 3: "\x i x \ f x" + using not_add_less1 by fastforce + then have "\x i x \\ e_nth (f \ (n + m)) x" + using cond by blast + then have "\x (n + m)). \ i x \\ e_nth (f \ (n + m)) x" + by simp + moreover have 4: "inconsist i (f \ (n + m)) \" + using assms(2) R1_imp_total1 inconsist_def by simp + ultimately have "inconsist i (f \ (n + m)) \= + (LEAST x. x < e_length (f \ (n + m)) \ \ i x \\ e_nth (f \ (n + m)) x)" + using inconsist_converg[OF 4] by simp + then have 5: "inconsist i (f \ (n + m)) \= (LEAST x. x < Suc (n + m) \ \ i x \ f x)" + using cond[of _ "n + m"] by simp + then have "(LEAST x. x < Suc n \ \ i x \ f x) = + (LEAST x. 
x < Suc n + m \ \ i x \ f x)" + using least_bounded_gr[where ?upper="Suc n"] 1 3 by simp + then show ?thesis using 2 5 by simp +qed + +definition "r_inconsist \ + let + f = Cn 2 r_length [Id 2 1]; + g = Cn 4 r_ifless + [Id 4 1, + Cn 4 r_length [Id 4 3], + Id 4 1, + Cn 4 r_ifeq + [Cn 4 r_phi [Id 4 2, Id 4 0], + Cn 4 r_nth [Id 4 3, Id 4 0], + Id 4 1, + Id 4 0]] + in Cn 2 (Pr 2 f g) [Cn 2 r_length [Id 2 1], Id 2 0, Id 2 1]" + +lemma r_inconsist_recfn: "recfn 2 r_inconsist" + unfolding r_inconsist_def by simp + +lemma r_inconsist: "eval r_inconsist [i, e] = inconsist i e" +proof - + define f where "f = Cn 2 r_length [Id 2 1]" + define len where "len = Cn 4 r_length [Id 4 3]" + define nth where "nth = Cn 4 r_nth [Id 4 3, Id 4 0]" + define ph where "ph = Cn 4 r_phi [Id 4 2, Id 4 0]" + define g where + "g = Cn 4 r_ifless [Id 4 1, len, Id 4 1, Cn 4 r_ifeq [ph, nth, Id 4 1, Id 4 0]]" + have "recfn 2 f" + unfolding f_def by simp + have f: "eval f [i, e] \= e_length e" + unfolding f_def by simp + have "recfn 4 len" + unfolding len_def by simp + have len: "eval len [j, v, i, e] \= e_length e" for j v + unfolding len_def by simp + have "recfn 4 nth" + unfolding nth_def by simp + have nth: "eval nth [j, v, i, e] \= e_nth e j" for j v + unfolding nth_def by simp + have "recfn 4 ph" + unfolding ph_def by simp + have ph: "eval ph [j, v, i, e] = \ i j" for j v + unfolding ph_def using phi_def by simp + have "recfn 4 g" + unfolding g_def using `recfn 4 nth` `recfn 4 ph` `recfn 4 len` by simp + have g_diverg: "eval g [j, v, i, e] \" if "eval ph [j, v, i, e] \" for j v + unfolding g_def using that `recfn 4 nth` `recfn 4 ph` `recfn 4 len` by simp + have g_converg: "eval g [j, v, i, e] \= + (if v < e_length e then v else if \ i j \= e_nth e j then v else j)" + if "eval ph [j, v, i, e] \" for j v + unfolding g_def using that `recfn 4 nth` `recfn 4 ph` `recfn 4 len` len nth ph + by auto + define h where "h \ Pr 2 f g" + then have "recfn 3 h" + by (simp add: \recfn 2 f\ \recfn 4 g\) + + let ?invariant = "\j i e. + (if \x i x \ then None + else if \x i x \\ e_nth e x + then Some (LEAST x. x < j \ \ i x \\ e_nth e x) + else Some (e_length e))" + + have "eval h [j, i, e] = ?invariant j i e" if "j \ e_length e" for j + using that + proof (induction j) + case 0 + then show ?case unfolding h_def using `recfn 2 f` f `recfn 4 g` by simp + next + case (Suc j) + then have j_less: "j < e_length e" by simp + then have j_le: "j \ e_length e" by simp + show ?case + proof (cases "eval h [j, i, e] \") + case True + then have "\x i x \" + using j_le Suc.IH by (metis option.simps(3)) + then have "\x i x \" + using less_SucI by blast + moreover have h: "eval h [Suc j, i, e] \" + using True h_def `recfn 3 h` by simp + ultimately show ?thesis by simp + next + case False + with Suc.IH j_le have h_j: "eval h [j, i, e] = + (if \x i x \\ e_nth e x + then Some (LEAST x. x < j \ \ i x \\ e_nth e x) + else Some (e_length e))" + by presburger + then have the_h_j: "the (eval h [j, i, e]) = + (if \x i x \\ e_nth e x + then LEAST x. 
x < j \ \ i x \\ e_nth e x + else e_length e)" + (is "_ = ?v") + by auto + have h_Suc: "eval h [Suc j, i, e] = eval g [j, the (eval h [j, i, e]), i, e]" + using False h_def `recfn 4 g` `recfn 2 f` by auto + show ?thesis + proof (cases "\ i j \") + case True + with ph g_diverg h_Suc show ?thesis by auto + next + case False + with h_Suc have "eval h [Suc j, i, e] \= + (if ?v < e_length e then ?v + else if \ i j \= e_nth e j then ?v else j)" + (is "_ \= ?lhs") + using g_converg ph the_h_j by simp + moreover have "?invariant (Suc j) i e \= + (if \x i x \\ e_nth e x + then LEAST x. x < Suc j \ \ i x \\ e_nth e x + else e_length e)" + (is "_ \= ?rhs") + proof - + from False have "\ i j \" by simp + moreover have "\ (\x i x \)" + by (metis (no_types, lifting) Suc.IH h_j j_le option.simps(3)) + ultimately have "\ (\x i x \)" + using less_Suc_eq by auto + then show ?thesis by auto + qed + moreover have "?lhs = ?rhs" + proof (cases "?v < e_length e") + case True + then have + ex_j: "\x i x \\ e_nth e x" and + v_eq: "?v = (LEAST x. x < j \ \ i x \\ e_nth e x)" + by presburger+ + with True have "?lhs = ?v" by simp + from ex_j have "\x i x \\ e_nth e x" + using less_SucI by blast + then have "?rhs = (LEAST x. x < Suc j \ \ i x \\ e_nth e x)" by simp + with True v_eq ex_j show ?thesis + using least_bounded_Suc[of j "\x. \ i x \\ e_nth e x"] by simp + next + case False + then have not_ex: "\ (\x i x \\ e_nth e x)" + using Least_le[of "\x. x < j \ \ i x \\ e_nth e x"] j_le + by (smt leD le_less_linear le_trans) + then have "?v = e_length e" by argo + with False have lhs: "?lhs = (if \ i j \= e_nth e j then e_length e else j)" + by simp + show ?thesis + proof (cases "\ i j \= e_nth e j") + case True + then have "\ (\x i x \\ e_nth e x)" + using less_SucE not_ex by blast + then have "?rhs = e_length e" by argo + moreover from True have "?lhs = e_length e" + using lhs by simp + ultimately show ?thesis by simp + next case False + then have "\ i j \\ e_nth e j" + using `\ i j \` by simp + with not_ex have "(LEAST x. x \ i x \\ e_nth e x) = j" + using LeastI[of "\x. x \ i x \\ e_nth e x" j] less_Suc_eq + by blast + then have "?rhs = j" + using \\ i j \\ e_nth e j\ by (meson lessI) + moreover from False lhs have "?lhs = j" by simp + ultimately show ?thesis by simp + qed + qed + ultimately show ?thesis by simp + qed + qed + qed + then have "eval h [e_length e, i, e] = ?invariant (e_length e) i e" + by auto + then have "eval h [e_length e, i, e] = inconsist i e" + using inconsist_def by simp + moreover have "eval (Cn 2 (Pr 2 f g) [Cn 2 r_length [Id 2 1], Id 2 0, Id 2 1]) [i, e] = + eval h [e_length e, i, e]" + using `recfn 4 g` `recfn 2 f` h_def by auto + ultimately show ?thesis + unfolding r_inconsist_def by (simp add: f_def g_def len_def nth_def ph_def) +qed + +lemma inconsist_for_total: + assumes "total1 (\ i)" + shows "inconsist i e \= + (if \x i x \\ e_nth e x + then LEAST x. x < e_length e \ \ i x \\ e_nth e x + else e_length e)" + unfolding inconsist_def using assms total1_def by (auto; blast) + +lemma inconsist_for_V01: + assumes "f \ V\<^sub>0\<^sub>1" and "k = amalgamate (the (f 0)) (the (f 1))" + shows "inconsist k e \= + (if \x k x \\ e_nth e x + then LEAST x. x < e_length e \ \ k x \\ e_nth e x + else e_length e)" +proof - + have "\ k \ \" + using amalgamation_V01_R1[OF assms(1)] assms(2) amalgamate by simp + then have "total1 (\ k)" by simp + with inconsist_for_total[of k] show ?thesis by simp +qed + +text \The next function computes Gödel numbers of functions consistent +with a given prefix. 
The strategy will use these as consistent auxiliary +hypotheses when receiving a prefix of length one.\ + +definition "r_auxhyp \ Cn 1 (r_smn 1 1) [r_const (encode r_prenum), Id 1 0]" + +lemma r_auxhyp_prim: "prim_recfn 1 r_auxhyp" + unfolding r_auxhyp_def by simp + +lemma r_auxhyp: "\ (the (eval r_auxhyp [e])) = prenum e" +proof + fix x + let ?p = "encode r_prenum" + let ?p = "encode r_prenum" + have "eval r_auxhyp [e] = eval (r_smn 1 1) [?p, e]" + unfolding r_auxhyp_def by simp + then have "eval r_auxhyp [e] \= smn 1 ?p [e]" + by (simp add: r_smn) + also have "... \= encode (Cn 1 (r_universal (1 + length [e])) + (r_constn (1 - 1) ?p # + map (r_constn (1 - 1)) [e] @ map (recf.Id 1) [0..<1]))" + using smn[of 1 ?p "[e]"] by simp + also have "... \= encode (Cn 1 (r_universal (1 + 1)) + (r_constn 0 ?p # map (r_constn 0) [e] @ [Id 1 0]))" + by simp + also have "... \= encode (Cn 1 (r_universal 2) + (r_constn 0 ?p # map (r_constn 0) [e] @ [Id 1 0]))" + by (metis one_add_one) + also have "... \= encode (Cn 1 (r_universal 2) [r_constn 0 ?p, r_constn 0 e, Id 1 0])" + by simp + also have "... \= encode (Cn 1 (r_universal 2) [r_const ?p, r_const e, Id 1 0])" + using r_constn_def by simp + finally have "eval r_auxhyp [e] \= + encode (Cn 1 (r_universal 2) [r_const ?p, r_const e, Id 1 0])" . + moreover have "\ (the (eval r_auxhyp [e])) x = eval r_phi [the (eval r_auxhyp [e]), x]" + by (simp add: phi_def) + ultimately have "\ (the (eval r_auxhyp [e])) x = + eval r_phi [encode (Cn 1 (r_universal 2) [r_const ?p, r_const e, Id 1 0]), x]" + (is "_ = eval r_phi [encode ?f, x]") + by simp + then have "\ (the (eval r_auxhyp [e])) x = + eval (Cn 1 (r_universal 2) [r_const ?p, r_const e, Id 1 0]) [x]" + using r_phi_def r_universal[of ?f 1 "[x]"] by simp + then have "\ (the (eval r_auxhyp [e])) x = eval (r_universal 2) [?p, e, x]" + by simp + then have "\ (the (eval r_auxhyp [e])) x = eval r_prenum [e, x]" + using r_universal by simp + then show "\ (the (eval r_auxhyp [e])) x = prenum e x" by simp +qed + +definition auxhyp :: partial1 where + "auxhyp e \ eval r_auxhyp [e]" + +lemma auxhyp_prenum: "\ (the (auxhyp e)) = prenum e" + using auxhyp_def r_auxhyp by metis + +lemma auxhyp_in_R1: "auxhyp \ \" + using auxhyp_def Mn_free_imp_total R1I r_auxhyp_prim by metis + +text \Now we can define our consistent learning strategy for @{term "V\<^sub>0\<^sub>1"}.\ + +definition "r_sv01 \ + let + at0 = Cn 1 r_nth [Id 1 0, Z]; + at1 = Cn 1 r_nth [Id 1 0, r_const 1]; + m = Cn 1 r_amalgamate [at0, at1]; + c = Cn 1 r_inconsist [m, Id 1 0]; + p = Cn 1 r_pdec1 [Cn 1 r_parallel [at0, at1, c]]; + g = Cn 1 r_ifeq [c, r_length, m, Cn 1 r_ifz [p, at1, at0]] + in Cn 1 (r_lifz r_auxhyp g) [Cn 1 r_eq [r_length, r_const 1], Id 1 0]" + +lemma r_sv01_recfn: "recfn 1 r_sv01" + unfolding r_sv01_def using r_auxhyp_prim r_inconsist_recfn r_amalgamate_recfn + by (simp add: Let_def) + +definition sv01 :: partial1 ("s\<^bsub>01\<^esub>")where + "sv01 e \ eval r_sv01 [e]" + +lemma sv01_in_P1: "s\<^bsub>01\<^esub> \ \
" + using sv01_def r_sv01_recfn P1I by presburger + +text \We are interested in the behavior of @{term "s\<^bsub>01\<^esub>"} only on +prefixes of functions in @{term "V\<^sub>0\<^sub>1"}. This behavior is linked +to the amalgamation of $f(0)$ and $f(1)$, where $f$ is the function +to be learned.\ + +abbreviation amalg01 :: "partial1 \ nat" where + "amalg01 f \ amalgamate (the (f 0)) (the (f 1))" + +lemma sv01: + assumes "f \ V\<^sub>0\<^sub>1" + shows "s\<^bsub>01\<^esub> (f \ 0) = auxhyp (f \ 0)" + and "n \ 0 \ + inconsist (amalg01 f) (f \ n) \= Suc n \ + s\<^bsub>01\<^esub> (f \ n) \= amalg01 f" + and "n \ 0 \ + the (inconsist (amalg01 f) (f \ n)) < Suc n \ + pdec1 (the (parallel (the (f 0)) (the (f 1)) (the (inconsist (amalg01 f) (f \ n))))) = 0 \ + s\<^bsub>01\<^esub> (f \ n) = f 1" + and "n \ 0 \ + the (inconsist (amalg01 f) (f \ n)) < Suc n \ + pdec1 (the (parallel (the (f 0)) (the (f 1)) (the (inconsist (amalg01 f) (f \ n))))) \ 0 \ + s\<^bsub>01\<^esub> (f \ n) = f 0" +proof - + have f_total: "\x. f x \" + using assms V01_def R1_imp_total1 by blast + define at0 where "at0 = Cn 1 r_nth [Id 1 0, Z]" + define at1 where "at1 = Cn 1 r_nth [Id 1 0, r_const 1]" + define m where "m = Cn 1 r_amalgamate [at0, at1]" + define c where "c = Cn 1 r_inconsist [m, Id 1 0]" + define p where "p = Cn 1 r_pdec1 [Cn 1 r_parallel [at0, at1, c]]" + define g where "g = Cn 1 r_ifeq [c, r_length, m, Cn 1 r_ifz [p, at1, at0]]" + have "recfn 1 g" + unfolding g_def p_def c_def m_def at1_def at0_def + using r_auxhyp_prim r_inconsist_recfn r_amalgamate_recfn + by simp + have "eval (Cn 1 r_eq [r_length, r_const 1]) [f \ 0] \= 0" + by simp + then have "eval r_sv01 [f \ 0] = eval r_auxhyp [f \ 0]" + unfolding r_sv01_def using `recfn 1 g` c_def g_def m_def p_def r_auxhyp_prim + by (auto simp add: Let_def) + then show "s\<^bsub>01\<^esub> (f \ 0) = auxhyp (f \ 0)" + by (simp add: auxhyp_def sv01_def) + + have sv01: "s\<^bsub>01\<^esub> (f \ n) = eval g [f \ n]" if "n \ 0" + proof - + have *: "eval (Cn 1 r_eq [r_length, r_const 1]) [f \ n] \\ 0" + (is "?r_eq \\ 0") + using that by simp + moreover have "recfn 2 (r_lifz r_auxhyp g)" + using `recfn 1 g` r_auxhyp_prim by simp + moreover have "eval r_sv01 [f \ n] = + eval (Cn 1 (r_lifz r_auxhyp g) [Cn 1 r_eq [r_length, r_const 1], Id 1 0]) [f \ n]" + using r_sv01_def by (metis at0_def at1_def c_def g_def m_def p_def) + ultimately have "eval r_sv01 [f \ n] = eval (r_lifz r_auxhyp g) [the ?r_eq, f \ n]" + by simp + then have "eval r_sv01 [f \ n] = eval g [f \ n]" + using "*" \recfn 1 g\ r_auxhyp_prim by auto + then show ?thesis by (simp add: sv01_def that) + qed + + have "recfn 1 at0" + unfolding at0_def by simp + have at0: "eval at0 [f \ n] \= the (f 0)" + unfolding at0_def by simp + have "recfn 1 at1" + unfolding at1_def by simp + have at1: "n \ 0 \ eval at1 [f \ n] \= the (f 1)" + unfolding at1_def by simp + have "recfn 1 m" + unfolding m_def at0_def at1_def using r_amalgamate_recfn by simp + have m: "n \ 0 \ eval m [f \ n] \= amalg01 f" + (is "_ \ _ \= ?m") + unfolding m_def at0_def at1_def + using at0 at1 amalgamate r_amalgamate r_amalgamate_recfn by simp + then have c: "n \ 0 \ eval c [f \ n] = inconsist (amalg01 f) (f \ n)" + (is "_ \ _ = ?c") + unfolding c_def using r_inconsist_recfn `recfn 1 m` r_inconsist by auto + then have c_converg: "n \ 0 \ eval c [f \ n] \" + using inconsist_for_V01[OF assms] by simp + have "recfn 1 c" + unfolding c_def using `recfn 1 m` r_inconsist_recfn by simp + + have par: "n \ 0 \ + eval (Cn 1 r_parallel [at0, at1, c]) [f \ n] = parallel 
(the (f 0)) (the (f 1)) (the ?c)" + (is "_ \ _ = ?par") + using at0 at1 c c_converg m r_parallel' `recfn 1 at0` `recfn 1 at1` `recfn 1 c` + by simp + with parallel_converg_V01[OF assms] have + par_converg: "n \ 0 \ eval (Cn 1 r_parallel [at0, at1, c]) [f \ n] \" + by simp + then have p_converg: "n \ 0 \ eval p [f \ n] \" + unfolding p_def using at0 at1 c_converg `recfn 1 at0` `recfn 1 at1` `recfn 1 c` + by simp + have p: "n \ 0 \ eval p [f \ n] \= pdec1 (the ?par)" + unfolding p_def + using at0 at1 c_converg `recfn 1 at0` `recfn 1 at1` `recfn 1 c` par par_converg + by simp + have "recfn 1 p" + unfolding p_def using `recfn 1 at0` `recfn 1 at1` `recfn 1 m` `recfn 1 c` + by simp + + let ?r = "Cn 1 r_ifz [p, at1, at0]" + have r: "n \ 0 \ eval ?r [f \ n] = (if pdec1 (the ?par) = 0 then f 1 else f 0)" + using at0 at1 c_converg `recfn 1 at0` `recfn 1 at1` `recfn 1 c` + `recfn 1 m` `recfn 1 p` p f_total + by fastforce + + have g: "n \ 0 \ + eval g [f \ n] \= + (if the ?c = e_length (f \ n) + then ?m else the (eval (Cn 1 r_ifz [p, at1, at0]) [f \ n]))" + unfolding g_def + using `recfn 1 p` `recfn 1 at0` `recfn 1 at1` `recfn 1 c` `recfn 1 m` + p_converg at1 at0 c c_converg m + by simp + { + assume "n \ 0" and "?c \= Suc n" + moreover have "e_length (f \ n) = Suc n" by simp + ultimately have "eval g [f \ n] \= ?m" using g by simp + then show "s\<^bsub>01\<^esub> (f \ n) \= amalg01 f" + using sv01[OF `n \ 0`] by simp + next + assume "n \ 0" and "the ?c < Suc n" and "pdec1 (the ?par) = 0" + with g r f_total have "eval g [f \ n] = f 1" by simp + then show "s\<^bsub>01\<^esub> (f \ n) = f 1" + using sv01[OF `n \ 0`] by simp + next + assume "n \ 0" and "the ?c < Suc n" and "pdec1 (the ?par) \ 0" + with g r f_total have "eval g [f \ n] = f 0" by simp + then show "s\<^bsub>01\<^esub> (f \ n) = f 0" + using sv01[OF `n \ 0`] by simp + } +qed + +text \Part of the correctness of @{term sv01} is convergence on +prefixes of functions in @{term "V\<^sub>0\<^sub>1"}.\ + +lemma sv01_converg_V01: + assumes "f \ V\<^sub>0\<^sub>1" + shows "s\<^bsub>01\<^esub> (f \ n) \" +proof (cases "n = 0") + case True + then show ?thesis + using assms sv01 R1_imp_total1 auxhyp_in_R1 by simp +next + case n_gr_0: False + show ?thesis + proof (cases "inconsist (amalg01 f) (f \ n) \= Suc n") + case True + then show ?thesis + using n_gr_0 assms sv01 by simp + next + case False + then have "the (inconsist (amalg01 f) (f \ n)) < Suc n" + using assms inconsist_bounded inconsist_for_V01 length_init + by (metis (no_types, lifting) le_neq_implies_less option.collapse option.simps(3)) + then show ?thesis + using n_gr_0 assms sv01 R1_imp_total1 total1E V01_def + by (metis (no_types, lifting) mem_Collect_eq) + qed +qed + +text \Another part of the correctness of @{term sv01} is its hypotheses +being consistent on prefixes of functions in @{term "V\<^sub>0\<^sub>1"}.\ + +lemma sv01_consistent_V01: + assumes "f \ V\<^sub>0\<^sub>1" + shows "\x\n. 
\ (the (s\<^bsub>01\<^esub> (f \ n))) x = f x" +proof (cases "n = 0") + case True + then have "s\<^bsub>01\<^esub> (f \ n) = auxhyp (f \ n)" + using sv01[OF assms] by simp + then have "\ (the (s\<^bsub>01\<^esub> (f \ n))) = prenum (f \ n)" + using auxhyp_prenum by simp + then show ?thesis + using R1_imp_total1 total1E assms by (simp add: V01_def) +next + case n_gr_0: False + let ?m = "amalg01 f" + let ?e = "f \ n" + let ?c = "the (inconsist ?m ?e)" + have c: "inconsist ?m ?e \" + using assms inconsist_for_V01 by blast + show ?thesis + proof (cases "inconsist ?m ?e \= Suc n") + case True + then show ?thesis + using assms n_gr_0 sv01 R1_imp_total1 total1E V01_def is_init_of_def + inconsist_consistent not_initial_imp_not_eq length_init inconsist_converg_eq + by (metis (no_types, lifting) le_imp_less_Suc mem_Collect_eq option.sel) + next + case False + then have less: "the (inconsist ?m ?e) < Suc n" + using c assms inconsist_bounded inconsist_for_V01 length_init + by (metis le_neq_implies_less option.collapse) + then have "the (inconsist ?m ?e) < e_length ?e" + by auto + then have + "\x ?m x \\ e_nth ?e x" + "inconsist ?m ?e \= (LEAST x. x < e_length ?e \ \ ?m x \\ e_nth ?e x)" + (is "_ \= Least ?P") + using inconsist_converg_less[OF c] by simp_all + then have "?P ?c" and "\x. x < ?c \ \ ?P x" + using LeastI_ex[of ?P] not_less_Least[of _ ?P] by (auto simp del: e_nth) + then have "\ ?m ?c \ f ?c" by auto + then have "amalgamation (the (f 0)) (the (f 1)) ?c \ f ?c" + using amalgamate by simp + then have *: "Some (pdec2 (the (parallel (the (f 0)) (the (f 1)) ?c))) \ f ?c" + using amalgamation_def by (metis assms parallel_converg_V01) + let ?p = "parallel (the (f 0)) (the (f 1)) ?c" + show ?thesis + proof (cases "pdec1 (the ?p) = 0") + case True + then have "\ (the (f 0)) ?c \= pdec2 (the ?p)" + using assms parallel_0 parallel_converg_V01 + by (metis option.collapse prod.collapse prod_decode_inverse) + then have "\ (the (f 0)) ?c \ f ?c" + using * by simp + then have "\ (the (f 0)) \ f" by auto + then have "\ (the (f 1)) = f" + using assms V01_def by auto + moreover have "s\<^bsub>01\<^esub> (f \ n) = f 1" + using True less n_gr_0 sv01 assms by simp + ultimately show ?thesis by simp + next + case False + then have "pdec1 (the ?p) = 1" + by (meson assms parallel_converg_V01 parallel_converg_pdec1_0_or_1) + then have "\ (the (f 1)) ?c \= pdec2 (the ?p)" + using assms parallel_1 parallel_converg_V01 + by (metis option.collapse prod.collapse prod_decode_inverse) + then have "\ (the (f 1)) ?c \ f ?c" + using * by simp + then have "\ (the (f 1)) \ f" by auto + then have "\ (the (f 0)) = f" + using assms V01_def by auto + moreover from False less n_gr_0 sv01 assms have "s\<^bsub>01\<^esub> (f \ n) = f 0" + by simp + ultimately show ?thesis by simp + qed + qed +qed + +text \The final part of the correctness is @{term "sv01"} converging +for all functions in @{term "V\<^sub>0\<^sub>1"}.\ + +lemma sv01_limit_V01: + assumes "f \ V\<^sub>0\<^sub>1" + shows "\i. \\<^sup>\n. s\<^bsub>01\<^esub> (f \ n) \= i" +proof (cases "\n>0. 
s\<^bsub>01\<^esub> (f \ n) \= amalgamate (the (f 0)) (the (f 1))") + case True + then show ?thesis by (meson less_le_trans zero_less_one) +next + case False + then obtain n\<^sub>0 where n0: + "n\<^sub>0 \ 0" + "s\<^bsub>01\<^esub> (f \ n\<^sub>0) \\ amalg01 f" + using \f \ V\<^sub>0\<^sub>1\ sv01_converg_V01 by blast + then have *: "the (inconsist (amalg01 f) (f \ n\<^sub>0)) < Suc n\<^sub>0" + (is "the (inconsist ?m (f \ n\<^sub>0)) < Suc n\<^sub>0") + using assms `n\<^sub>0 \ 0` sv01(2) inconsist_bounded inconsist_for_V01 length_init + by (metis (no_types, lifting) le_neq_implies_less option.collapse option.simps(3)) + moreover have "f \ \" + using assms V01_def by auto + moreover have "\ ?m \ \" + using amalgamate amalgamation_V01_R1 assms by auto + moreover have "inconsist ?m (f \ n\<^sub>0) \" + using inconsist_for_V01 assms by blast + ultimately have **: "inconsist ?m (f \ (n\<^sub>0 + m)) = inconsist ?m (f \ n\<^sub>0)" for m + using inconsist_init_converg_less[of f ?m] by simp + then have "the (inconsist ?m (f \ (n\<^sub>0 + m))) < Suc n\<^sub>0 + m" for m + using * by auto + moreover have + "pdec1 (the (parallel (the (f 0)) (the (f 1)) (the (inconsist ?m (f \ (n\<^sub>0 + m)))))) = + pdec1 (the (parallel (the (f 0)) (the (f 1)) (the (inconsist ?m (f \ n\<^sub>0)))))" + for m + using ** by auto + moreover have "n\<^sub>0 + m \ 0" for m + using `n\<^sub>0 \ 0` by simp + ultimately have "s\<^bsub>01\<^esub> (f \ (n\<^sub>0 + m)) = s\<^bsub>01\<^esub> (f \ n\<^sub>0)" for m + using assms sv01 * \n\<^sub>0 \ 0\ by (metis add_Suc) + moreover define i where "i = s\<^bsub>01\<^esub> (f \ n\<^sub>0)" + ultimately have "\n\n\<^sub>0. s\<^bsub>01\<^esub> (f \ n) = i" + using nat_le_iff_add by auto + then have "\n\n\<^sub>0. s\<^bsub>01\<^esub> (f \ n) \= the i" + using n0(2) by simp + then show ?thesis by auto +qed + +lemma V01_learn_cons: "learn_cons \ V\<^sub>0\<^sub>1 s\<^bsub>01\<^esub>" +proof (rule learn_consI2) + show "environment \ V\<^sub>0\<^sub>1 s\<^bsub>01\<^esub>" + by (simp add: Collect_mono V01_def phi_in_P2 sv01_in_P1 sv01_converg_V01) + show "\f n. f \ V\<^sub>0\<^sub>1 \ \k\n. \ (the (s\<^bsub>01\<^esub> (f \ n))) k = f k" + using sv01_consistent_V01 . + show "\i n\<^sub>0. \n\n\<^sub>0. s\<^bsub>01\<^esub> (f \ n) \= i" if "f \ V\<^sub>0\<^sub>1" for f + using sv01_limit_V01 that by simp +qed + +corollary V01_in_CONS: "V\<^sub>0\<^sub>1 \ CONS" + using V01_learn_cons CONS_def by auto + +text \Now we can show the main result of this section, namely that +there is a consistently learnable class that cannot be learned consistently +by a total strategy. In other words, there is no Lemma~R for CONS.\ + +lemma no_lemma_R_for_CONS: "\U. U \ CONS \ (\ (\s. s \ \ \ learn_cons \ U s))" + using V01_in_CONS V01_not_in_R_cons by auto + +end \ No newline at end of file diff --git a/thys/Inductive_Inference/Partial_Recursive.thy b/thys/Inductive_Inference/Partial_Recursive.thy new file mode 100644 --- /dev/null +++ b/thys/Inductive_Inference/Partial_Recursive.thy @@ -0,0 +1,1914 @@ +chapter \Partial recursive functions\ + +theory Partial_Recursive + imports Main "HOL-Library.Nat_Bijection" +begin + +text \This chapter lays the foundation for Chapter~\ref{c:iirf}. +Essentially it develops recursion theory up to the point of certain +fixed-point theorems. This in turn requires standard results such as the +existence of a universal function and the $s$-$m$-$n$ theorem. 
Besides these, +the chapter contains some results, mostly regarding decidability and the +Kleene normal form, that are not strictly needed later. They are included as +relatively low-hanging fruits to round off the chapter. + +The formalization of partial recursive functions is very much inspired by the +Universal Turing Machine AFP entry by Xu +et~al.~\cite{Universal_Turing_Machine-AFP}. It models partial recursive +functions as algorithms whose semantics is given by an evaluation function. +This works well for most of this chapter. For the next chapter, however, it +is beneficial to regard partial recursive functions as ``proper'' partial +functions. To that end, Section~\ref{s:alternative} introduces more +conventional and convenient notation for the common special cases of unary +and binary partial recursive functions. + +Especially for the nontrivial proofs I consulted the classical textbook by +Rogers~\cite{Rogers87}, which also partially explains my preferring the +traditional term ``recursive'' to the more modern ``computable''.\ + + +section \Basic definitions\ + + +subsection \Partial recursive functions\ + +text \To represent partial recursive functions we start from the same +datatype as Xu et~al.~\cite{Universal_Turing_Machine-AFP}, more specifically +from Urban's version of the formalization. In fact the datatype @{text recf} +and the function @{text arity} below have been copied verbatim from it.\ + +datatype recf = + Z +| S +| Id nat nat +| Cn nat recf "recf list" +| Pr nat recf recf +| Mn nat recf + +fun arity :: "recf \ nat" where + "arity Z = 1" +| "arity S = 1" +| "arity (Id m n) = m" +| "arity (Cn n f gs) = n" +| "arity (Pr n f g) = Suc n" +| "arity (Mn n f) = n" + +text \Already we deviate from Xu et~al.\ in that we define a +well-formedness predicate for partial recursive functions. Well-formedness +essentially means arity constraints are respected when combining @{typ +recf}s.\ + +fun wellf :: "recf \ bool" where + "wellf Z = True" +| "wellf S = True" +| "wellf (Id m n) = (n < m)" +| "wellf (Cn n f gs) = + (n > 0 \ (\g \ set gs. arity g = n \ wellf g) \ arity f = length gs \ wellf f)" +| "wellf (Pr n f g) = + (arity g = Suc (Suc n) \ arity f = n \ wellf f \ wellf g)" +| "wellf (Mn n f) = (n > 0 \ arity f = Suc n \ wellf f)" + +lemma wellf_arity_nonzero: "wellf f \ arity f > 0" + by (induction f rule: arity.induct) simp_all + +lemma wellf_Pr_arity_greater_1: "wellf (Pr n f g) \ arity (Pr n f g) > 1" + using wellf_arity_nonzero by auto + +text \For the most part of this chapter this is the meaning of ``$f$ +is an $n$-ary partial recursive function'':\ + +abbreviation recfn :: "nat \ recf \ bool" where + "recfn n f \ wellf f \ arity f = n" + +text \Some abbreviations for working with @{typ "nat option"}:\ + +abbreviation divergent :: "nat option \ bool" ("_ \" [50] 50) where + "x \ \ x = None" + +abbreviation convergent :: "nat option \ bool" ("_ \" [50] 50) where + "x \ \ x \ None" + +abbreviation convergent_eq :: "nat option \ nat \ bool" (infix "\=" 50) where + "x \= y \ x = Some y" + +abbreviation convergent_neq :: "nat option \ nat \ bool" (infix "\\" 50) where + "x \\ y \ x \ \ x \ Some y" + +text \In prose the terms ``halt'', ``terminate'', ``converge'', and +``defined'' will be used interchangeably; likewise for ``not halt'', +``diverge'', and ``undefined''. 
In names of lemmas, the abbreviations @{text +converg} and @{text diverg} will be used consistently.\ + +text \Our second major deviation from Xu +et~al.~\cite{Universal_Turing_Machine-AFP} is that we model the semantics of +a @{typ recf} by combining the value and the termination of a function into +one evaluation function with codomain @{typ "nat option"}, rather than +separating both aspects into an evaluation function with codomain @{typ nat} +and a termination predicate. + +The value of a well-formed partial recursive function applied to a +correctly-sized list of arguments:\ + +fun eval_wellf :: "recf \ nat list \ nat option" where + "eval_wellf Z xs \= 0" +| "eval_wellf S xs \= Suc (xs ! 0)" +| "eval_wellf (Id m n) xs \= xs ! n" +| "eval_wellf (Cn n f gs) xs = + (if \g \ set gs. eval_wellf g xs \ + then eval_wellf f (map (\g. the (eval_wellf g xs)) gs) + else None)" +| "eval_wellf (Pr n f g) [] = undefined" +| "eval_wellf (Pr n f g) (0 # xs) = eval_wellf f xs" +| "eval_wellf (Pr n f g) (Suc x # xs) = + Option.bind (eval_wellf (Pr n f g) (x # xs)) (\v. eval_wellf g (x # v # xs))" +| "eval_wellf (Mn n f) xs = + (let E = \z. eval_wellf f (z # xs) + in if \z. E z \= 0 \ (\y) + then Some (LEAST z. E z \= 0 \ (\y)) + else None)" + +text \We define a function value only if the @{typ recf} is well-formed +and its arity matches the number of arguments.\ + +definition eval :: "recf \ nat list \ nat option" where + "recfn (length xs) f \ eval f xs \ eval_wellf f xs" + +lemma eval_Z [simp]: "eval Z [x] \= 0" + by (simp add: eval_def) + +lemma eval_Z' [simp]: "length xs = 1 \ eval Z xs \= 0" + by (simp add: eval_def) + +lemma eval_S [simp]: "eval S [x] \= Suc x" + by (simp add: eval_def) + +lemma eval_S' [simp]: "length xs = 1 \ eval S xs \= Suc (hd xs)" + using eval_def hd_conv_nth[of xs] by fastforce + +lemma eval_Id [simp]: + assumes "n < m" and "m = length xs" + shows "eval (Id m n) xs \= xs ! n" + using assms by (simp add: eval_def) + +lemma eval_Cn [simp]: + assumes "recfn (length xs) (Cn n f gs)" + shows "eval (Cn n f gs) xs = + (if \g\set gs. eval g xs \ + then eval f (map (\g. the (eval g xs)) gs) + else None)" +proof - + have "eval (Cn n f gs) xs = eval_wellf (Cn n f gs) xs" + using assms eval_def by blast + moreover have "\g. g \ set gs \ eval_wellf g xs = eval g xs" + using assms eval_def by simp + ultimately have "eval (Cn n f gs) xs = + (if \g\set gs. eval g xs \ + then eval_wellf f (map (\g. the (eval g xs)) gs) + else None)" + using map_eq_conv[of "\g. the (eval_wellf g xs)" gs "\g. the (eval g xs)"] + by (auto, metis) + moreover have "\ys. 
length ys = length gs \ eval f ys = eval_wellf f ys" + using assms eval_def by simp + ultimately show ?thesis by auto +qed + +lemma eval_Pr_0 [simp]: + assumes "recfn (Suc n) (Pr n f g)" and "n = length xs" + shows "eval (Pr n f g) (0 # xs) = eval f xs" + using assms by (simp add: eval_def) + +lemma eval_Pr_diverg_Suc [simp]: + assumes "recfn (Suc n) (Pr n f g)" + and "n = length xs" + and "eval (Pr n f g) (x # xs) \" + shows "eval (Pr n f g) (Suc x # xs) \" + using assms by (simp add: eval_def) + +lemma eval_Pr_converg_Suc [simp]: + assumes "recfn (Suc n) (Pr n f g)" + and "n = length xs" + and "eval (Pr n f g) (x # xs) \" + shows "eval (Pr n f g) (Suc x # xs) = eval g (x # the (eval (Pr n f g) (x # xs)) # xs)" + using assms eval_def by auto + +lemma eval_Pr_diverg_add: + assumes "recfn (Suc n) (Pr n f g)" + and "n = length xs" + and "eval (Pr n f g) (x # xs) \" + shows "eval (Pr n f g) ((x + y) # xs) \" + using assms by (induction y) auto + +lemma eval_Pr_converg_le: + assumes "recfn (Suc n) (Pr n f g)" + and "n = length xs" + and "eval (Pr n f g) (x # xs) \" + and "y \ x" + shows "eval (Pr n f g) (y # xs) \" + using assms eval_Pr_diverg_add le_Suc_ex by metis + +lemma eval_Pr_Suc_converg: + assumes "recfn (Suc n) (Pr n f g)" + and "n = length xs" + and "eval (Pr n f g) (Suc x # xs) \" + shows "eval g (x # (the (eval (Pr n f g) (x # xs))) # xs) \" + and "eval (Pr n f g) (Suc x # xs) = eval g (x # the (eval (Pr n f g) (x # xs)) # xs)" + using eval_Pr_converg_Suc[of n f g xs x, OF assms(1,2)] + eval_Pr_converg_le[of n f g xs "Suc x" x, OF assms] assms(3) + by simp_all + +lemma eval_Mn [simp]: + assumes "recfn (length xs) (Mn n f)" + shows "eval (Mn n f) xs = + (if (\z. eval f (z # xs) \= 0 \ (\y)) + then Some (LEAST z. eval f (z # xs) \= 0 \ (\y)) + else None)" + using assms eval_def by auto + +text \For $\mu$-recursion, the condition @{term "(\y)"} +inside @{text LEAST} in the definition of @{term eval_wellf} is redundant.\ + +lemma eval_wellf_Mn: + "eval_wellf (Mn n f) xs = + (if (\z. eval_wellf f (z # xs) \= 0 \ (\y)) + then Some (LEAST z. eval_wellf f (z # xs) \= 0) + else None)" +proof - + let ?P = "\z. eval_wellf f (z # xs) \= 0 \ (\y)" + { + assume "\z. ?P z" + moreover define z where "z = Least ?P" + ultimately have "?P z" + using LeastI[of ?P] by blast + have "(LEAST z. eval_wellf f (z # xs) \= 0) = z" + proof (rule Least_equality) + show "eval_wellf f (z # xs) \= 0" + using `?P z` by simp + show "z \ y" if "eval_wellf f (y # xs) \= 0" for y + proof (rule ccontr) + assume "\ z \ y" + then have "y < z" by simp + moreover from this have "?P y" + using that `?P z` by simp + ultimately show False + using that not_less_Least z_def by blast + qed + qed + } + then show ?thesis by simp +qed + +lemma eval_Mn': + assumes "recfn (length xs) (Mn n f)" + shows "eval (Mn n f) xs = + (if (\z. eval f (z # xs) \= 0 \ (\y)) + then Some (LEAST z. eval f (z # xs) \= 0) + else None)" + using assms eval_def eval_wellf_Mn by auto + +text \Proving that $\mu$-recursion converges is easier if one does not +have to deal with @{text LEAST} directly.\ + +lemma eval_Mn_convergI: + assumes "recfn (length xs) (Mn n f)" + and "eval f (z # xs) \= 0" + and "\y. y < z \ eval f (y # xs) \\ 0" + shows "eval (Mn n f) xs \= z" +proof - + let ?P = "\z. 
eval f (z # xs) \= 0 \ (\y)" + have "z = Least ?P" + using Least_equality[of ?P z] assms(2,3) not_le_imp_less by blast + moreover have "?P z" using assms(2,3) by simp + ultimately show "eval (Mn n f) xs \= z" + using eval_Mn[OF assms(1)] by meson +qed + +text \Similarly, reasoning from a $\mu$-recursive function is +simplified somewhat by the next lemma.\ + +lemma eval_Mn_convergE: + assumes "recfn (length xs) (Mn n f)" and "eval (Mn n f) xs \= z" + shows "z = (LEAST z. eval f (z # xs) \= 0 \ (\y))" + and "eval f (z # xs) \= 0" + and "\y. y < z \ eval f (y # xs) \\ 0" +proof - + let ?P = "\z. eval f (z # xs) \= 0 \ (\y)" + show "z = Least ?P" + using assms eval_Mn[OF assms(1)] + by (metis (no_types, lifting) option.inject option.simps(3)) + moreover have "\z. ?P z" + using assms eval_Mn[OF assms(1)] by (metis option.distinct(1)) + ultimately have "?P z" + using LeastI[of ?P] by blast + then have "eval f (z # xs) \= 0 \ (\y)" + by simp + then show "eval f (z # xs) \= 0" by simp + show "\y. y < z \ eval f (y # xs) \\ 0" + using not_less_Least[of _ ?P] `z = Least ?P` `?P z` less_trans by blast +qed + +lemma eval_Mn_diverg: + assumes "recfn (length xs) (Mn n f)" + shows "\ (\z. eval f (z # xs) \= 0 \ (\y)) \ eval (Mn n f) xs \" + using assms eval_Mn[OF assms(1)] by simp + + +subsection \Extensional equality\ + +definition exteq :: "recf \ recf \ bool" (infix "\" 55) where + "f \ g \ arity f = arity g \ (\xs. length xs = arity f \ eval f xs = eval g xs)" + +lemma exteq_refl: "f \ f" + using exteq_def by simp + +lemma exteq_sym: "f \ g \ g \ f" + using exteq_def by simp + +lemma exteq_trans: "f \ g \ g \ h \ f \ h" + using exteq_def by simp + +lemma exteqI: + assumes "arity f = arity g" and "\xs. length xs = arity f \ eval f xs = eval g xs" + shows "f \ g" + using assms exteq_def by simp + +lemma exteqI1: + assumes "arity f = 1" and "arity g = 1" and "\x. 
eval f [x] = eval g [x]" + shows "f \ g" + using assms exteqI by (metis One_nat_def Suc_length_conv length_0_conv) + +text \For every partial recursive function @{term f} there are +infinitely many extensionally equal ones, for example, those that wrap @{term +f} arbitrarily often in the identity function.\ + +fun wrap_Id :: "recf \ nat \ recf" where + "wrap_Id f 0 = f" +| "wrap_Id f (Suc n) = Cn (arity f) (Id 1 0) [wrap_Id f n]" + +lemma recfn_wrap_Id: "recfn a f \ recfn a (wrap_Id f n)" + using wellf_arity_nonzero by (induction n) auto + +lemma exteq_wrap_Id: "recfn a f \ f \ wrap_Id f n" +proof (induction n) + case 0 + then show ?case by (simp add: exteq_refl) +next + case (Suc n) + have "wrap_Id f n \ wrap_Id f (Suc n) " + proof (rule exteqI) + show "arity (wrap_Id f n) = arity (wrap_Id f (Suc n))" + using Suc by (simp add: recfn_wrap_Id) + show "eval (wrap_Id f n) xs = eval (wrap_Id f (Suc n)) xs" + if "length xs = arity (wrap_Id f n)" for xs + proof - + have "recfn (length xs) (Cn (arity f) (Id 1 0) [wrap_Id f n])" + using that Suc recfn_wrap_Id by (metis wrap_Id.simps(2)) + then show "eval (wrap_Id f n) xs = eval (wrap_Id f (Suc n)) xs" + by auto + qed + qed + then show ?case using Suc exteq_trans by fast +qed + +fun depth :: "recf \ nat" where + "depth Z = 0" +| "depth S = 0" +| "depth (Id m n) = 0" +| "depth (Cn n f gs) = Suc (max (depth f) (Max (set (map depth gs))))" +| "depth (Pr n f g) = Suc (max (depth f) (depth g))" +| "depth (Mn n f) = Suc (depth f)" + +lemma depth_wrap_Id: "recfn a f \ depth (wrap_Id f n) = depth f + n" + by (induction n) simp_all + +lemma wrap_Id_injective: + assumes "recfn a f" and "wrap_Id f n\<^sub>1 = wrap_Id f n\<^sub>2" + shows "n\<^sub>1 = n\<^sub>2" + using assms by (metis add_left_cancel depth_wrap_Id) + +lemma exteq_infinite: + assumes "recfn a f" + shows "infinite {g. recfn a g \ g \ f}" (is "infinite ?R") +proof - + have "inj (wrap_Id f)" + using wrap_Id_injective `recfn a f` by (meson inj_onI) + then have "infinite (range (wrap_Id f))" + using finite_imageD by blast + moreover have "range (wrap_Id f) \ ?R" + using assms exteq_sym exteq_wrap_Id recfn_wrap_Id by blast + ultimately show ?thesis by (simp add: infinite_super) +qed + + +subsection \Primitive recursive and total functions\ + +fun Mn_free :: "recf \ bool" where + "Mn_free Z = True" +| "Mn_free S = True" +| "Mn_free (Id m n) = True" +| "Mn_free (Cn n f gs) = ((\g \ set gs. Mn_free g) \ Mn_free f)" +| "Mn_free (Pr n f g) = (Mn_free f \ Mn_free g)" +| "Mn_free (Mn n f) = False" + +text \This is our notion of $n$-ary primitive recursive function:\ + +abbreviation prim_recfn :: "nat \ recf \ bool" where + "prim_recfn n f \ recfn n f \ Mn_free f" + +definition total :: "recf \ bool" where + "total f \ \xs. length xs = arity f \ eval f xs \" + +lemma totalI [intro]: + assumes "\xs. length xs = arity f \ eval f xs \" + shows "total f" + using assms total_def by simp + +lemma totalE [simp]: + assumes "total f" and "recfn n f" and "length xs = n" + shows "eval f xs \" + using assms total_def by simp + +lemma totalI1 : + assumes "recfn 1 f" and "\x. eval f [x] \" + shows "total f" + using assms totalI[of f] by (metis One_nat_def length_0_conv length_Suc_conv) + +lemma totalI2: + assumes "recfn 2 f" and "\x y. eval f [x, y] \" + shows "total f" + using assms totalI[of f] by (smt length_0_conv length_Suc_conv numeral_2_eq_2) + +lemma totalI3: + assumes "recfn 3 f" and "\x y z. 
eval f [x, y, z] \" + shows "total f" + using assms totalI[of f] by (smt length_0_conv length_Suc_conv numeral_3_eq_3) + +lemma totalI4: + assumes "recfn 4 f" and "\w x y z. eval f [w, x, y, z] \" + shows "total f" +proof (rule totalI[of f]) + fix xs :: "nat list" + assume "length xs = arity f" + then have "length xs = Suc (Suc (Suc (Suc 0)))" + using assms(1) by simp + then obtain w x y z where "xs = [w, x, y, z]" + by (smt Suc_length_conv length_0_conv) + then show "eval f xs \" using assms(2) by simp +qed + +lemma Mn_free_imp_total [intro]: + assumes "wellf f" and "Mn_free f" + shows "total f" + using assms +proof (induction f rule: Mn_free.induct) + case (5 n f g) + have "eval (Pr n f g) (x # xs) \" if "length (x # xs) = arity (Pr n f g)" for x xs + using 5 that by (induction x) auto + then show ?case by (metis arity.simps(5) length_Suc_conv totalI) +qed (auto simp add: total_def eval_def) + +lemma prim_recfn_total: "prim_recfn n f \ total f" + using Mn_free_imp_total by simp + +lemma eval_Pr_prim_Suc: + assumes "h = Pr n f g" and "prim_recfn (Suc n) h" and "length xs = n" + shows "eval h (Suc x # xs) = eval g (x # the (eval h (x # xs)) # xs)" + using assms eval_Pr_converg_Suc prim_recfn_total by simp + +lemma Cn_total: + assumes "\g\set gs. total g" and "total f" and "recfn n (Cn n f gs)" + shows "total (Cn n f gs)" + using assms by (simp add: totalI) + +lemma Pr_total: + assumes "total f" and "total g" and "recfn (Suc n) (Pr n f g)" + shows "total (Pr n f g)" +proof - + have "eval (Pr n f g) (x # xs) \" if "length xs = n" for x xs + using that assms by (induction x) auto + then show ?thesis + using assms(3) totalI by (metis Suc_length_conv arity.simps(5)) +qed + +lemma eval_Mn_total: + assumes "recfn (length xs) (Mn n f)" and "total f" + shows "eval (Mn n f) xs = + (if (\z. eval f (z # xs) \= 0) + then Some (LEAST z. eval f (z # xs) \= 0) + else None)" + using assms by auto + + +section \Simple functions\ + +text \This section, too, bears some similarity to Urban's formalization +in Xu et~al.~\cite{Universal_Turing_Machine-AFP}, but is more minimalistic in +scope. + +As a general naming rule, instances of @{typ recf} and functions +returning such instances get names starting with @{text r_}. Typically, for +an @{text r_xyz} there will be a lemma @{text r_xyz_recfn} or @{text +r_xyz_prim} establishing its (primitive) recursiveness, arity, and +well-formedness. Moreover there will be a lemma @{text r_xyz} describing its +semantics, for which we will sometimes introduce an Isabelle function @{text +xyz}.\ + + +subsection \Manipulating parameters\ + +text \Appending dummy parameters:\ + +definition r_dummy :: "nat \ recf \ recf" where + "r_dummy n f \ Cn (arity f + n) f (map (\i. Id (arity f + n) i) [0.. prim_recfn (a + n) (r_dummy n f)" + using wellf_arity_nonzero by (auto simp add: r_dummy_def) + +lemma r_dummy_recfn [simp]: + "recfn a f \ recfn (a + n) (r_dummy n f)" + using wellf_arity_nonzero by (auto simp add: r_dummy_def) + +lemma r_dummy [simp]: + "r_dummy n f = Cn (arity f + n) f (map (\i. Id (arity f + n) i) [0..= xs ! i" if "i < arity f" for i + using that assms by (simp add: nth_append) + ultimately have "map (\g. the (eval_wellf g (xs @ ys))) ?gs = xs" + by (metis (no_types, lifting) assms(1) length_map nth_equalityI nth_map option.sel) + moreover have "\g \ set ?gs. 
eval_wellf g (xs @ ys) \" + using * by simp + moreover have "recfn (length (xs @ ys)) ?r" + using assms r_dummy_recfn by fastforce + ultimately show ?thesis + by (auto simp add: assms eval_def) +qed + +text \Shrinking a binary function to a unary one is useful when we want +to define a unary function via the @{term Pr} operation, which can only +construct @{typ recf}s of arity two or higher.\ + +definition r_shrink :: "recf \ recf" where + "r_shrink f \ Cn 1 f [Id 1 0, Id 1 0]" + +lemma r_shrink_prim [simp]: "prim_recfn 2 f \ prim_recfn 1 (r_shrink f)" + by (simp add: r_shrink_def) + +lemma r_shrink_recfn [simp]: "recfn 2 f \ recfn 1 (r_shrink f)" + by (simp add: r_shrink_def) + +lemma r_shrink [simp]: "recfn 2 f \ eval (r_shrink f) [x] = eval f [x, x]" + by (simp add: r_shrink_def) + +definition r_swap :: "recf \ recf" where + "r_swap f \ Cn 2 f [Id 2 1, Id 2 0]" + +lemma r_swap_recfn [simp]: "recfn 2 f \ recfn 2 (r_swap f)" + by (simp add: r_swap_def) + +lemma r_swap_prim [simp]: "prim_recfn 2 f \ prim_recfn 2 (r_swap f)" + by (simp add: r_swap_def) + +lemma r_swap [simp]: "recfn 2 f \ eval (r_swap f) [x, y] = eval f [y, x]" + by (simp add: r_swap_def) + +text \Prepending one dummy parameter:\ + +definition r_shift :: "recf \ recf" where + "r_shift f \ Cn (Suc (arity f)) f (map (\i. Id (Suc (arity f)) (Suc i)) [0.. prim_recfn (Suc a) (r_shift f)" + by (simp add: r_shift_def) + +lemma r_shift_recfn [simp]: "recfn a f \ recfn (Suc a) (r_shift f)" + by (simp add: r_shift_def) + +lemma r_shift [simp]: + assumes "recfn (length xs) f" + shows "eval (r_shift f) (x # xs) = eval f xs" +proof - + let ?r = "r_shift f" + let ?gs = "map (\i. Id (Suc (arity f)) (Suc i)) [0..= xs ! i" if "i < arity f" for i + using assms nth_append that by simp + ultimately have "map (\g. the (eval g (x # xs))) ?gs = xs" + by (metis (no_types, lifting) assms length_map nth_equalityI nth_map option.sel) + moreover have "\g \ set ?gs. 
eval g (x # xs) \ None" + using * by simp + ultimately show ?thesis using r_shift_def assms by simp +qed + + +subsection \Arithmetic and logic\ + +text \The unary constants:\ + +fun r_const :: "nat \ recf" where + "r_const 0 = Z" +| "r_const (Suc c) = Cn 1 S [r_const c]" + +lemma r_const_prim [simp]: "prim_recfn 1 (r_const c)" + by (induction c) (simp_all) + +lemma r_const [simp]: "eval (r_const c) [x] \= c" + by (induction c) simp_all + +text \Constants of higher arities:\ + +definition "r_constn n c \ if n = 0 then r_const c else r_dummy n (r_const c)" + +lemma r_constn_prim [simp]: "prim_recfn (Suc n) (r_constn n c)" + unfolding r_constn_def by simp + +lemma r_constn [simp]: "length xs = Suc n \ eval (r_constn n c) xs \= c" + unfolding r_constn_def + by simp (metis length_0_conv length_Suc_conv r_const) + +text \We introduce addition, subtraction, and multiplication, but +interestingly enough we can make do without division.\ + +definition "r_add \ Pr 1 (Id 1 0) (Cn 3 S [Id 3 1])" + +lemma r_add_prim [simp]: "prim_recfn 2 r_add" + by (simp add: r_add_def) + +lemma r_add [simp]: "eval r_add [a, b] \= a + b" + unfolding r_add_def by (induction a) simp_all + +definition "r_mul \ Pr 1 Z (Cn 3 r_add [Id 3 1, Id 3 2])" + +lemma r_mul_prim [simp]: "prim_recfn 2 r_mul" + unfolding r_mul_def by simp + +lemma r_mul [simp]: "eval r_mul [a, b] \= a * b" + unfolding r_mul_def by (induction a) simp_all + +definition "r_dec \ Cn 1 (Pr 1 Z (Id 3 0)) [Id 1 0, Id 1 0]" + +lemma r_dec_prim [simp]: "prim_recfn 1 r_dec" + by (simp add: r_dec_def) + +lemma r_dec [simp]: "eval r_dec [a] \= a - 1" +proof - + have "eval (Pr 1 Z (Id 3 0)) [x, y] \= x - 1" for x y + by (induction x) simp_all + then show ?thesis by (simp add: r_dec_def) +qed + +definition "r_sub \ r_swap (Pr 1 (Id 1 0) (Cn 3 r_dec [Id 3 1]))" + +lemma r_sub_prim [simp]: "prim_recfn 2 r_sub" + unfolding r_sub_def by simp + +lemma r_sub [simp]: "eval r_sub [a, b] \= a - b" +proof - + have "eval (Pr 1 (Id 1 0) (Cn 3 r_dec [Id 3 1])) [x, y] \= y - x" for x y + by (induction x) simp_all + then show ?thesis unfolding r_sub_def by simp +qed + +definition "r_sign \ r_shrink (Pr 1 Z (r_constn 2 1))" + +lemma r_sign_prim [simp]: "prim_recfn 1 r_sign" + unfolding r_sign_def by simp + +lemma r_sign [simp]: "eval r_sign [x] \= (if x = 0 then 0 else 1)" +proof - + have "eval (Pr 1 Z (r_constn 2 1)) [x, y] \= (if x = 0 then 0 else 1)" for x y + by (induction x) simp_all + then show ?thesis unfolding r_sign_def by simp +qed + +text \In the logical functions, true will be represented by zero, and +false will be represented by non-zero as argument and by one as +result.\ + +definition "r_not \ Cn 1 r_sub [r_const 1, r_sign]" + +lemma r_not_prim [simp]: "prim_recfn 1 r_not" + unfolding r_not_def by simp + +lemma r_not [simp]: "eval r_not [x] \= (if x = 0 then 1 else 0)" + unfolding r_not_def by simp + +definition "r_nand \ Cn 2 r_not [r_add]" + +lemma r_nand_prim [simp]: "prim_recfn 2 r_nand" + unfolding r_nand_def by simp + +lemma r_nand [simp]: "eval r_nand [x, y] \= (if x = 0 \ y = 0 then 1 else 0)" + unfolding r_nand_def by simp + +definition "r_and \ Cn 2 r_not [r_nand]" + +lemma r_and_prim [simp]: "prim_recfn 2 r_and" + unfolding r_and_def by simp + +lemma r_and [simp]: "eval r_and [x, y] \= (if x = 0 \ y = 0 then 0 else 1)" + unfolding r_and_def by simp + +definition "r_or \ Cn 2 r_sign [r_mul]" + +lemma r_or_prim [simp]: "prim_recfn 2 r_or" + unfolding r_or_def by simp + +lemma r_or [simp]: "eval r_or [x, y] \= (if x = 0 \ y = 0 then 0 else 1)" + unfolding 
r_or_def by simp + + +subsection \Comparison and conditions\ + +definition "r_ifz \ + let ifzero = (Cn 3 r_mul [r_dummy 2 r_not, Id 3 1]); + ifnzero = (Cn 3 r_mul [r_dummy 2 r_sign, Id 3 2]) + in Cn 3 r_add [ifzero, ifnzero]" + +lemma r_ifz_prim [simp]: "prim_recfn 3 r_ifz" + unfolding r_ifz_def by simp + +lemma r_ifz [simp]: "eval r_ifz [cond, val0, val1] \= (if cond = 0 then val0 else val1)" + unfolding r_ifz_def by (simp add: Let_def) + +definition "r_eq \ Cn 2 r_sign [Cn 2 r_add [r_sub, r_swap r_sub]]" + +lemma r_eq_prim [simp]: "prim_recfn 2 r_eq" + unfolding r_eq_def by simp + +lemma r_eq [simp]: "eval r_eq [x, y] \= (if x = y then 0 else 1)" + unfolding r_eq_def by simp + +definition "r_ifeq \ Cn 4 r_ifz [r_dummy 2 r_eq, Id 4 2, Id 4 3]" + +lemma r_ifeq_prim [simp]: "prim_recfn 4 r_ifeq" + unfolding r_ifeq_def by simp + +lemma r_ifeq [simp]: "eval r_ifeq [a, b, v\<^sub>0, v\<^sub>1] \= (if a = b then v\<^sub>0 else v\<^sub>1)" + unfolding r_ifeq_def using r_dummy_append[of r_eq "[a, b]" "[v\<^sub>0, v\<^sub>1]" 2] + by simp + +definition "r_neq \ Cn 2 r_not [r_eq]" + +lemma r_neq_prim [simp]: "prim_recfn 2 r_neq" + unfolding r_neq_def by simp + +lemma r_neq [simp]: "eval r_neq [x, y] \= (if x = y then 1 else 0)" + unfolding r_neq_def by simp + +definition "r_ifle \ Cn 4 r_ifz [r_dummy 2 r_sub, Id 4 2, Id 4 3]" + +lemma r_ifle_prim [simp]: "prim_recfn 4 r_ifle" + unfolding r_ifle_def by simp + +lemma r_ifle [simp]: "eval r_ifle [a, b, v\<^sub>0, v\<^sub>1] \= (if a \ b then v\<^sub>0 else v\<^sub>1)" + unfolding r_ifle_def using r_dummy_append[of r_sub "[a, b]" "[v\<^sub>0, v\<^sub>1]" 2] + by simp + +definition "r_ifless \ Cn 4 r_ifle [Id 4 1, Id 4 0, Id 4 3, Id 4 2]" + +lemma r_ifless_prim [simp]: "prim_recfn 4 r_ifless" + unfolding r_ifless_def by simp + +lemma r_ifless [simp]: "eval r_ifless [a, b, v\<^sub>0, v\<^sub>1] \= (if a < b then v\<^sub>0 else v\<^sub>1)" + unfolding r_ifless_def by simp + +definition "r_less \ Cn 2 r_ifle [Id 2 1, Id 2 0, r_constn 1 1, r_constn 1 0]" + +lemma r_less_prim [simp]: "prim_recfn 2 r_less" + unfolding r_less_def by simp + +lemma r_less [simp]: "eval r_less [x, y] \= (if x < y then 0 else 1)" + unfolding r_less_def by simp + +definition "r_le \ Cn 2 r_ifle [Id 2 0, Id 2 1, r_constn 1 0, r_constn 1 1]" + +lemma r_le_prim [simp]: "prim_recfn 2 r_le" + unfolding r_le_def by simp + +lemma r_le [simp]: "eval r_le [x, y] \= (if x \ y then 0 else 1)" + unfolding r_le_def by simp + +text \Arguments are evaluated eagerly. Therefore @{term "r_ifz"}, etc. +cannot be combined with a diverging function to implement a conditionally +diverging function in the naive way. The following function implements a +special case needed in the next section. A \hyperlink{p:r_lifz}{general lazy +version} of @{term "r_ifz"} will be introduced later with the help of a +universal function.\ + +definition "r_ifeq_else_diverg \ + Cn 3 r_add [Id 3 2, Mn 3 (Cn 4 r_add [Id 4 0, Cn 4 r_eq [Id 4 1, Id 4 2]])]" + +lemma r_ifeq_else_diverg_recfn [simp]: "recfn 3 r_ifeq_else_diverg" + unfolding r_ifeq_else_diverg_def by simp + +lemma r_ifeq_else_diverg [simp]: + "eval r_ifeq_else_diverg [a, b, v] = (if a = b then Some v else None)" + unfolding r_ifeq_else_diverg_def by simp + + +section \The halting problem\label{s:halting}\ + +text \Decidability will be treated more thoroughly in +Section~\ref{s:decidable}. But the halting problem is prominent enough to +deserve an early mention.\ + +definition decidable :: "nat set \ bool" where + "decidable X \ \f. recfn 1 f \ (\x. 
eval f [x] \= (if x \ X then 1 else 0))" + +text \No matter how partial recursive functions are encoded as natural +numbers, the set of all codes of functions halting on their own code is +undecidable.\ + +theorem halting_problem_undecidable: + fixes code :: "nat \ recf" + assumes "\f. recfn 1 f \ \i. code i = f" + shows "\ decidable {x. eval (code x) [x] \}" (is "\ decidable ?K") +proof + assume "decidable ?K" + then obtain f where "recfn 1 f" and f: "\x. eval f [x] \= (if x \ ?K then 1 else 0)" + using decidable_def by auto + define g where "g \ Cn 1 r_ifeq_else_diverg [f, Z, Z]" + then have "recfn 1 g" + using `recfn 1 f` r_ifeq_else_diverg_recfn by simp + with assms obtain i where i: "code i = g" by auto + from g_def have "eval g [x] = (if x \ ?K then Some 0 else None)" for x + using r_ifeq_else_diverg_recfn `recfn 1 f` f by simp + then have "eval g [i] \ \ i \ ?K" by simp + also have "... \ eval (code i) [i] \" by simp + also have "... \ eval g [i] \" + using i by simp + finally have "eval g [i] \ \ eval g [i] \" . + then show False by auto +qed + + +section \Encoding tuples and lists\ + +text \This section is based on the Cantor encoding for pairs. Tuples +are encoded by repeated application of the pairing function, lists by pairing +their length with the code for a tuple. Thus tuples have a fixed length that +must be known when decoding, whereas lists are dynamically sized and know +their current length.\ + + +subsection \Pairs and tuples\ + + +subsubsection \The Cantor pairing function\ + +definition "r_triangle \ r_shrink (Pr 1 Z (r_dummy 1 (Cn 2 S [r_add])))" + +lemma r_triangle_prim: "prim_recfn 1 r_triangle" + unfolding r_triangle_def by simp + +lemma r_triangle: "eval r_triangle [n] \= Sum {0..n}" +proof - + let ?r = "r_dummy 1 (Cn 2 S [r_add])" + have "eval ?r [x, y, z] \= Suc (x + y)" for x y z + using r_dummy_append[of "Cn 2 S [r_add]" "[x, y]" "[z]" 1] by simp + then have "eval (Pr 1 Z ?r) [x, y] \= Sum {0..x}" for x y + by (induction x) simp_all + then show ?thesis unfolding r_triangle_def by simp +qed + +lemma r_triangle_eq_triangle [simp]: "eval r_triangle [n] \= triangle n" + using r_triangle gauss_sum_nat triangle_def by simp + +definition "r_prod_encode \ Cn 2 r_add [Cn 2 r_triangle [r_add], Id 2 0]" + +lemma r_prod_encode_prim [simp]: "prim_recfn 2 r_prod_encode" + unfolding r_prod_encode_def using r_triangle_prim by simp + +lemma r_prod_encode [simp]: "eval r_prod_encode [m, n] \= prod_encode (m, n)" + unfolding r_prod_encode_def prod_encode_def using r_triangle_prim by simp + +text \These abbreviations are just two more things borrowed from +Xu~et~al.~\cite{Universal_Turing_Machine-AFP}.\ + +abbreviation "pdec1 z \ fst (prod_decode z)" + +abbreviation "pdec2 z \ snd (prod_decode z)" + +lemma pdec1_le: "pdec1 i \ i" + by (metis le_prod_encode_1 prod.collapse prod_decode_inverse) + +lemma pdec2_le: "pdec2 i \ i" + by (metis le_prod_encode_2 prod.collapse prod_decode_inverse) + +lemma pdec_less: "pdec2 i < Suc i" + using pdec2_le by (simp add: le_imp_less_Suc) + +lemma pdec1_zero: "pdec1 0 = 0" + using pdec1_le by auto + +definition "r_maxletr \ + Pr 1 Z (Cn 3 r_ifle [r_dummy 2 (Cn 1 r_triangle [S]), Id 3 2, Cn 3 S [Id 3 0], Id 3 1])" + +lemma r_maxletr_prim: "prim_recfn 2 r_maxletr" + unfolding r_maxletr_def using r_triangle_prim by simp + +lemma not_Suc_Greatest_not_Suc: + assumes "\ P (Suc x)" and "\x. P x" + shows "(GREATEST y. y \ x \ P y) = (GREATEST y. 
y \ Suc x \ P y)" + using assms by (metis le_SucI le_Suc_eq) + +lemma r_maxletr: "eval r_maxletr [x\<^sub>0, x\<^sub>1] \= (GREATEST y. y \ x\<^sub>0 \ triangle y \ x\<^sub>1)" +proof - + let ?g = "Cn 3 r_ifle [r_dummy 2 (Cn 1 r_triangle [S]), Id 3 2, Cn 3 S [Id 3 0], Id 3 1]" + have greatest: + "(if triangle (Suc x\<^sub>0) \ x\<^sub>1 then Suc x\<^sub>0 else (GREATEST y. y \ x\<^sub>0 \ triangle y \ x\<^sub>1)) = + (GREATEST y. y \ Suc x\<^sub>0 \ triangle y \ x\<^sub>1)" + for x\<^sub>0 x\<^sub>1 + proof (cases "triangle (Suc x\<^sub>0) \ x\<^sub>1") + case True + then show ?thesis + using Greatest_equality[of "\y. y \ Suc x\<^sub>0 \ triangle y \ x\<^sub>1"] by fastforce + next + case False + then show ?thesis + using not_Suc_Greatest_not_Suc[of "\y. triangle y \ x\<^sub>1" x\<^sub>0] by fastforce + qed + show ?thesis + unfolding r_maxletr_def using r_triangle_prim + proof (induction x\<^sub>0) + case 0 + then show ?case + using Greatest_equality[of "\y. y \ 0 \ triangle y \ x\<^sub>1" 0] by simp + next + case (Suc x\<^sub>0) + then show ?case using greatest by simp + qed +qed + +definition "r_maxlt \ r_shrink r_maxletr" + +lemma r_maxlt_prim: "prim_recfn 1 r_maxlt" + unfolding r_maxlt_def using r_maxletr_prim by simp + +lemma r_maxlt: "eval r_maxlt [e] \= (GREATEST y. triangle y \ e)" +proof - + have "y \ triangle y" for y + by (induction y) auto + then have "triangle y \ e \ y \ e" for y e + using order_trans by blast + then have "(GREATEST y. y \ e \ triangle y \ e) = (GREATEST y. triangle y \ e)" + by metis + moreover have "eval r_maxlt [e] \= (GREATEST y. y \ e \ triangle y \ e)" + using r_maxletr r_shrink r_maxlt_def r_maxletr_prim by fastforce + ultimately show ?thesis by simp +qed + +definition "pdec1' e \ e - triangle (GREATEST y. triangle y \ e)" + +definition "pdec2' e \ (GREATEST y. triangle y \ e) - pdec1' e" + +lemma max_triangle_bound: "triangle z \ e \ z \ e" + by (metis Suc_pred add_leD2 less_Suc_eq triangle_Suc zero_le zero_less_Suc) + +lemma triangle_greatest_le: "triangle (GREATEST y. triangle y \ e) \ e" + using max_triangle_bound GreatestI_nat[of "\y. triangle y \ e" 0 e] by simp + +lemma prod_encode_pdec': "prod_encode (pdec1' e, pdec2' e) = e" +proof - + let ?P = "\y. triangle y \ e" + let ?y = "GREATEST y. ?P y" + have "pdec1' e \ ?y" + proof (rule ccontr) + assume "\ pdec1' e \ ?y" + then have "e - triangle ?y > ?y" + using pdec1'_def by simp + then have "?P (Suc ?y)" by simp + moreover have "\z. 
?P z \ z \ e" + using max_triangle_bound by simp + ultimately have "Suc ?y \ ?y" + using Greatest_le_nat[of ?P "Suc ?y" e] by blast + then show False by simp + qed + then have "pdec1' e + pdec2' e = ?y" + using pdec1'_def pdec2'_def by simp + then have "prod_encode (pdec1' e, pdec2' e) = triangle ?y + pdec1' e" + by (simp add: prod_encode_def) + then show ?thesis using pdec1'_def triangle_greatest_le by simp +qed + +lemma pdec': + "pdec1' e = pdec1 e" + "pdec2' e = pdec2 e" + using prod_encode_pdec' prod_encode_inverse by (metis fst_conv, metis snd_conv) + +definition "r_pdec1 \ Cn 1 r_sub [Id 1 0, Cn 1 r_triangle [r_maxlt]]" + +lemma r_pdec1_prim [simp]: "prim_recfn 1 r_pdec1" + unfolding r_pdec1_def using r_triangle_prim r_maxlt_prim by simp + +lemma r_pdec1 [simp]: "eval r_pdec1 [e] \= pdec1 e" + unfolding r_pdec1_def using r_triangle_prim r_maxlt_prim pdec' pdec1'_def + by (simp add: r_maxlt) + +definition "r_pdec2 \ Cn 1 r_sub [r_maxlt, r_pdec1]" + +lemma r_pdec2_prim [simp]: "prim_recfn 1 r_pdec2" + unfolding r_pdec2_def using r_maxlt_prim by simp + +lemma r_pdec2 [simp]: "eval r_pdec2 [e] \= pdec2 e" + unfolding r_pdec2_def using r_maxlt_prim r_maxlt pdec' pdec2'_def by simp + +abbreviation "pdec12 i \ pdec1 (pdec2 i)" +abbreviation "pdec22 i \ pdec2 (pdec2 i)" +abbreviation "pdec122 i \ pdec1 (pdec22 i)" +abbreviation "pdec222 i \ pdec2 (pdec22 i)" + +definition "r_pdec12 \ Cn 1 r_pdec1 [r_pdec2]" + +lemma r_pdec12_prim [simp]: "prim_recfn 1 r_pdec12" + unfolding r_pdec12_def by simp + +lemma r_pdec12 [simp]: "eval r_pdec12 [e] \= pdec12 e" + unfolding r_pdec12_def by simp + +definition "r_pdec22 \ Cn 1 r_pdec2 [r_pdec2]" + +lemma r_pdec22_prim [simp]: "prim_recfn 1 r_pdec22" + unfolding r_pdec22_def by simp + +lemma r_pdec22 [simp]: "eval r_pdec22 [e] \= pdec22 e" + unfolding r_pdec22_def by simp + +definition "r_pdec122 \ Cn 1 r_pdec1 [r_pdec22]" + +lemma r_pdec122_prim [simp]: "prim_recfn 1 r_pdec122" + unfolding r_pdec122_def by simp + +lemma r_pdec122 [simp]: "eval r_pdec122 [e] \= pdec122 e" + unfolding r_pdec122_def by simp + +definition "r_pdec222 \ Cn 1 r_pdec2 [r_pdec22]" + +lemma r_pdec222_prim [simp]: "prim_recfn 1 r_pdec222" + unfolding r_pdec222_def by simp + +lemma r_pdec222 [simp]: "eval r_pdec222 [e] \= pdec222 e" + unfolding r_pdec222_def by simp + + +subsubsection \The Cantor tuple function\ + +text \The empty tuple gets no code, whereas singletons are encoded by their +only element and other tuples by recursively applying the pairing function. 
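+For instance, under this scheme a pair $(x, y)$ is encoded as @{term "prod_encode (x, y)"} and a triple $(x, y, z)$ as @{term "prod_encode (x, prod_encode (y, z))"}.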
+This yields, for every $n$, the function @{term "tuple_encode n"}, which is a +bijection between the natural numbers and the lists of length $(n + 1)$.\ + +fun tuple_encode :: "nat \ nat list \ nat" where + "tuple_encode n [] = undefined" +| "tuple_encode 0 (x # xs) = x" +| "tuple_encode (Suc n) (x # xs) = prod_encode (x, tuple_encode n xs)" + +lemma tuple_encode_prod_encode: "tuple_encode 1 [x, y] = prod_encode (x, y)" + by simp + +fun tuple_decode where + "tuple_decode 0 i = [i]" +| "tuple_decode (Suc n) i = pdec1 i # tuple_decode n (pdec2 i)" + +lemma tuple_encode_decode [simp]: + "tuple_encode (length xs - 1) (tuple_decode (length xs - 1) i) = i" +proof (induction "length xs - 1" arbitrary: xs i) + case 0 + then show ?case by simp +next + case (Suc n) + then have "length xs - 1 > 0" by simp + with Suc have *: "tuple_encode n (tuple_decode n j) = j" for j + by (metis diff_Suc_1 length_tl) + from Suc have "tuple_decode (Suc n) i = pdec1 i # tuple_decode n (pdec2 i)" + using tuple_decode.simps(2) by blast + then have "tuple_encode (Suc n) (tuple_decode (Suc n) i) = + tuple_encode (Suc n) (pdec1 i # tuple_decode n (pdec2 i))" + using Suc by simp + also have "... = prod_encode (pdec1 i, tuple_encode n (tuple_decode n (pdec2 i)))" + by simp + also have "... = prod_encode (pdec1 i, pdec2 i)" + using Suc * by simp + also have "... = i" by simp + finally have "tuple_encode (Suc n) (tuple_decode (Suc n) i) = i" . + then show ?case by (simp add: Suc.hyps(2)) +qed + +lemma tuple_encode_decode' [simp]: "tuple_encode n (tuple_decode n i) = i" + using tuple_encode_decode by (metis Ex_list_of_length diff_Suc_1 length_Cons) + +lemma tuple_decode_encode: + assumes "length xs > 0" + shows "tuple_decode (length xs - 1) (tuple_encode (length xs - 1) xs) = xs" + using assms +proof (induction "length xs - 1" arbitrary: xs) + case 0 + moreover from this have "length xs = 1" by linarith + ultimately show ?case + by (metis One_nat_def length_0_conv length_Suc_conv tuple_decode.simps(1) + tuple_encode.simps(2)) +next + case (Suc n) + let ?t = "tl xs" + let ?i = "tuple_encode (Suc n) xs" + have "length ?t > 0" and "length ?t - 1 = n" + using Suc by simp_all + then have "tuple_decode n (tuple_encode n ?t) = ?t" + using Suc by blast + moreover have "?i = prod_encode (hd xs, tuple_encode n ?t)" + using Suc by (metis hd_Cons_tl length_greater_0_conv tuple_encode.simps(3)) + moreover have "tuple_decode (Suc n) ?i = pdec1 ?i # tuple_decode n (pdec2 ?i)" + using tuple_decode.simps(2) by blast + ultimately have "tuple_decode (Suc n) ?i = xs" + using Suc.prems by simp + then show ?case by (simp add: Suc.hyps(2)) +qed + +lemma tuple_decode_encode' [simp]: + assumes "length xs = Suc n" + shows "tuple_decode n (tuple_encode n xs) = xs" + using assms tuple_decode_encode by (metis diff_Suc_1 zero_less_Suc) + +lemma tuple_decode_length [simp]: "length (tuple_decode n i) = Suc n" + by (induction n arbitrary: i) simp_all + +lemma tuple_decode_nonzero: + assumes "n > 0" + shows "tuple_decode n i = pdec1 i # tuple_decode (n - 1) (pdec2 i)" + using assms by (metis One_nat_def Suc_pred tuple_decode.simps(2)) + +text \The tuple encoding functions are primitive recursive.\ + +fun r_tuple_encode :: "nat \ recf" where + "r_tuple_encode 0 = Id 1 0" +| "r_tuple_encode (Suc n) = + Cn (Suc (Suc n)) r_prod_encode [Id (Suc (Suc n)) 0, r_shift (r_tuple_encode n)]" + +lemma r_tuple_encode_prim [simp]: "prim_recfn (Suc n) (r_tuple_encode n)" + by (induction n) simp_all + +lemma r_tuple_encode: + assumes "length xs = Suc n" + shows "eval 
(r_tuple_encode n) xs \= tuple_encode n xs" + using assms +proof (induction n arbitrary: xs) + case 0 + then show ?case + by (metis One_nat_def eval_Id length_Suc_conv nth_Cons_0 + r_tuple_encode.simps(1) tuple_encode.simps(2) zero_less_one) +next + case (Suc n) + then obtain y ys where y_ys: "y # ys = xs" + by (metis length_Suc_conv) + with Suc have "eval (r_tuple_encode n) ys \= tuple_encode n ys" + by auto + with y_ys have "eval (r_shift (r_tuple_encode n)) xs \= tuple_encode n ys" + using Suc.prems r_shift_prim r_tuple_encode_prim by auto + moreover have "eval (Id (Suc (Suc n)) 0) xs \= y" + using y_ys Suc.prems by auto + ultimately have "eval (r_tuple_encode (Suc n)) xs \= prod_encode (y, tuple_encode n ys)" + using Suc.prems by simp + then show ?case using y_ys by auto +qed + + +subsubsection \Functions on encoded tuples\ + +text \The function for accessing the $n$-th element of a tuple returns +$0$ for out-of-bounds access.\ + +definition e_tuple_nth :: "nat \ nat \ nat \ nat" where + "e_tuple_nth a i n \ if n \ a then (tuple_decode a i) ! n else 0" + +lemma e_tuple_nth_le [simp]: "n \ a \ e_tuple_nth a i n = (tuple_decode a i) ! n" + using e_tuple_nth_def by simp + +lemma e_tuple_nth_gr [simp]: "n > a \ e_tuple_nth a i n = 0" + using e_tuple_nth_def by simp + +lemma tuple_decode_pdec2: "tuple_decode a (pdec2 es) = tl (tuple_decode (Suc a) es)" + by simp + +fun iterate :: "nat \ ('a \ 'a) \ ('a \ 'a)" where + "iterate 0 f = id" +| "iterate (Suc n) f = f \ (iterate n f)" + +lemma iterate_additive: + assumes "iterate t\<^sub>1 f x = y" and "iterate t\<^sub>2 f y = z" + shows "iterate (t\<^sub>1 + t\<^sub>2) f x = z" + using assms by (induction t\<^sub>2 arbitrary: z) auto + +lemma iterate_additive': "iterate (t\<^sub>1 + t\<^sub>2) f x = iterate t\<^sub>2 f (iterate t\<^sub>1 f x)" + using iterate_additive by metis + +lemma e_tuple_nth_elementary: + assumes "k \ a" + shows "e_tuple_nth a i k = (if a = k then (iterate k pdec2 i) else (pdec1 (iterate k pdec2 i)))" +proof - + have *: "tuple_decode (a - k) (iterate k pdec2 i) = drop k (tuple_decode a i)" + using assms + by (induction k) (simp, simp add: Suc_diff_Suc tuple_decode_pdec2 drop_Suc tl_drop) + show ?thesis + proof (cases "a = k") + case True + then have "tuple_decode 0 (iterate k pdec2 i) = drop k (tuple_decode a i)" + using assms * by simp + moreover from this have "drop k (tuple_decode a i) = [tuple_decode a i ! k]" + using assms True by (metis nth_via_drop tuple_decode.simps(1)) + ultimately show ?thesis using True by simp + next + case False + with assms have "a - k > 0" by simp + with * have "tuple_decode (a - k) (iterate k pdec2 i) = drop k (tuple_decode a i)" + by simp + then have "pdec1 (iterate k pdec2 i) = hd (drop k (tuple_decode a i))" + using tuple_decode_nonzero `a - k > 0` by (metis list.sel(1)) + with `a - k > 0` have "pdec1 (iterate k pdec2 i) = (tuple_decode a i) ! 
k" + by (simp add: hd_drop_conv_nth) + with False assms show ?thesis by simp + qed +qed + +definition "r_nth_inbounds \ + let r = Pr 1 (Id 1 0) (Cn 3 r_pdec2 [Id 3 1]) + in Cn 3 r_ifeq + [Id 3 0, + Id 3 2, + Cn 3 r [Id 3 2, Id 3 1], + Cn 3 r_pdec1 [Cn 3 r [Id 3 2, Id 3 1]]]" + +lemma r_nth_inbounds_prim: "prim_recfn 3 r_nth_inbounds" + unfolding r_nth_inbounds_def by (simp add: Let_def) + +lemma r_nth_inbounds: + "k \ a \ eval r_nth_inbounds [a, i, k] \= e_tuple_nth a i k" + "eval r_nth_inbounds [a, i, k] \" +proof - + let ?r = "Pr 1 (Id 1 0) (Cn 3 r_pdec2 [Id 3 1])" + let ?h = "Cn 3 ?r [Id 3 2, Id 3 1]" + have "eval ?r [k, i] \= iterate k pdec2 i" for k i + using r_pdec2_prim by (induction k) (simp_all) + then have "eval ?h [a, i, k] \= iterate k pdec2 i" + using r_pdec2_prim by simp + then have "eval r_nth_inbounds [a, i, k] \= + (if a = k then iterate k pdec2 i else pdec1 (iterate k pdec2 i))" + unfolding r_nth_inbounds_def by (simp add: Let_def) + then show "k \ a \ eval r_nth_inbounds [a, i, k] \= e_tuple_nth a i k" + and "eval r_nth_inbounds [a, i, k] \" + using e_tuple_nth_elementary by simp_all +qed + +definition "r_tuple_nth \ + Cn 3 r_ifle [Id 3 2, Id 3 0, r_nth_inbounds, r_constn 2 0]" + +lemma r_tuple_nth_prim: "prim_recfn 3 r_tuple_nth" + unfolding r_tuple_nth_def using r_nth_inbounds_prim by simp + +lemma r_tuple_nth [simp]: "eval r_tuple_nth [a, i, k] \= e_tuple_nth a i k" + unfolding r_tuple_nth_def using r_nth_inbounds_prim r_nth_inbounds by simp + + +subsection \Lists\ + + +subsubsection \Encoding and decoding\ + +text \Lists are encoded by pairing the length of the list with the code +for the tuple made up of the list's elements. Then all these codes are +incremented in order to make room for the empty list +(cf.~Rogers~\cite[p.~71]{Rogers87}).\ + +fun list_encode :: "nat list \ nat" where + "list_encode [] = 0" +| "list_encode (x # xs) = Suc (prod_encode (length xs, tuple_encode (length xs) (x # xs)))" + +lemma list_encode_0 [simp]: "list_encode xs = 0 \ xs = []" + using list_encode.elims by blast + +lemma list_encode_1: "list_encode [0] = 1" + by (simp add: prod_encode_def) + +fun list_decode :: "nat \ nat list" where + "list_decode 0 = []" +| "list_decode (Suc n) = tuple_decode (pdec1 n) (pdec2 n)" + +lemma list_encode_decode [simp]: "list_encode (list_decode n) = n" +proof (cases n) + case 0 + then show ?thesis by simp +next + case (Suc k) + then have *: "list_decode n = tuple_decode (pdec1 k) (pdec2 k)" (is "_ = ?t") + by simp + then obtain x xs where xxs: "x # xs = ?t" + by (metis tuple_decode.elims) + then have "list_encode ?t = list_encode (x # xs)" by simp + then have 1: "list_encode ?t = Suc (prod_encode (length xs, tuple_encode (length xs) (x # xs)))" + by simp + have 2: "length xs = length ?t - 1" + using xxs by (metis length_tl list.sel(3)) + then have 3: "length xs = pdec1 k" + using * by simp + then have "tuple_encode (length ?t - 1) ?t = pdec2 k" + using 2 tuple_encode_decode by metis + then have "list_encode ?t = Suc (prod_encode (pdec1 k, pdec2 k))" + using 1 2 3 xxs by simp + with * Suc show ?thesis by simp +qed + +lemma list_decode_encode [simp]: "list_decode (list_encode xs) = xs" +proof (cases xs) + case Nil + then show ?thesis by simp +next + case (Cons y ys) + then have "list_encode xs = + Suc (prod_encode (length ys, tuple_encode (length ys) xs))" + (is "_ = Suc ?i") + by simp + then have "list_decode (Suc ?i) = tuple_decode (pdec1 ?i) (pdec2 ?i)" by simp + moreover have "pdec1 ?i = length ys" by simp + moreover have "pdec2 ?i = tuple_encode 
(length ys) xs" by simp + ultimately have "list_decode (Suc ?i) = + tuple_decode (length ys) (tuple_encode (length ys) xs)" + by simp + moreover have "length ys = length xs - 1" + using Cons by simp + ultimately have "list_decode (Suc ?i) = + tuple_decode (length xs - 1) (tuple_encode (length xs - 1) xs)" + by simp + then show ?thesis using Cons by simp +qed + +abbreviation singleton_encode :: "nat \ nat" where + "singleton_encode x \ list_encode [x]" + +lemma list_decode_singleton: "list_decode (singleton_encode x) = [x]" + by simp + +definition "r_singleton_encode \ Cn 1 S [Cn 1 r_prod_encode [Z, Id 1 0]]" + +lemma r_singleton_encode_prim [simp]: "prim_recfn 1 r_singleton_encode" + unfolding r_singleton_encode_def by simp + +lemma r_singleton_encode [simp]: "eval r_singleton_encode [x] \= singleton_encode x" + unfolding r_singleton_encode_def by simp + +definition r_list_encode :: "nat \ recf" where + "r_list_encode n \ Cn (Suc n) S [Cn (Suc n) r_prod_encode [r_constn n n, r_tuple_encode n]]" + +lemma r_list_encode_prim [simp]: "prim_recfn (Suc n) (r_list_encode n)" + unfolding r_list_encode_def by simp + +lemma r_list_encode: + assumes "length xs = Suc n" + shows "eval (r_list_encode n) xs \= list_encode xs" +proof - + have "eval (r_tuple_encode n) xs \" + by (simp add: assms r_tuple_encode) + then have "eval (Cn (Suc n) r_prod_encode [r_constn n n, r_tuple_encode n]) xs \" + using assms by simp + then have "eval (r_list_encode n) xs = + eval S [the (eval (Cn (Suc n) r_prod_encode [r_constn n n, r_tuple_encode n]) xs)]" + unfolding r_list_encode_def using assms r_tuple_encode by simp + moreover from assms obtain y ys where "xs = y # ys" + by (meson length_Suc_conv) + ultimately show ?thesis + unfolding r_list_encode_def using assms r_tuple_encode by simp +qed + + +subsubsection \Functions on encoded lists\ + +text \The functions in this section mimic those on type @{typ "nat +list"}. Their names are prefixed by @{text e_} and the names of the +corresponding @{typ recf}s by @{text r_}.\ + +abbreviation e_tl :: "nat \ nat" where + "e_tl e \ list_encode (tl (list_decode e))" + +text \In order to turn @{term e_tl} into a partial recursive function +we first represent it in a more elementary way.\ + +lemma e_tl_elementary: + "e_tl e = + (if e = 0 then 0 + else if pdec1 (e - 1) = 0 then 0 + else Suc (prod_encode (pdec1 (e - 1) - 1, pdec22 (e - 1))))" +proof (cases e) + case 0 + then show ?thesis by simp +next + case Suc_d: (Suc d) + then show ?thesis + proof (cases "pdec1 d") + case 0 + then show ?thesis using Suc_d by simp + next + case (Suc a) + have *: "list_decode e = tuple_decode (pdec1 d) (pdec2 d)" + using Suc_d by simp + with Suc obtain x xs where xxs: "list_decode e = x # xs" by simp + then have **: "e_tl e = list_encode xs" by simp + have "list_decode (Suc (prod_encode (pdec1 (e - 1) - 1, pdec22 (e - 1)))) = + tuple_decode (pdec1 (e - 1) - 1) (pdec22 (e - 1))" + (is "?lhs = _") + by simp + also have "... = tuple_decode a (pdec22 (e - 1))" + using Suc Suc_d by simp + also have "... = tl (tuple_decode (Suc a) (pdec2 (e - 1)))" + using tuple_decode_pdec2 Suc by presburger + also have "... = tl (tuple_decode (pdec1 (e - 1)) (pdec2 (e - 1)))" + using Suc Suc_d by auto + also have "... = tl (list_decode e)" + using * Suc_d by simp + also have "... = xs" + using xxs by simp + finally have "?lhs = xs" . 
+ then have "list_encode ?lhs = list_encode xs" by simp + then have "Suc (prod_encode (pdec1 (e - 1) - 1, pdec22 (e - 1))) = list_encode xs" + using list_encode_decode by metis + then show ?thesis using ** Suc_d Suc by simp + qed +qed + +definition "r_tl \ + let r = Cn 1 r_pdec1 [r_dec] + in Cn 1 r_ifz + [Id 1 0, + Z, + Cn 1 r_ifz + [r, Z, Cn 1 S [Cn 1 r_prod_encode [Cn 1 r_dec [r], Cn 1 r_pdec22 [r_dec]]]]]" + +lemma r_tl_prim [simp]: "prim_recfn 1 r_tl" + unfolding r_tl_def by (simp add: Let_def) + +lemma r_tl [simp]: "eval r_tl [e] \= e_tl e" + unfolding r_tl_def using e_tl_elementary by (simp add: Let_def) + +text \We define the head of the empty encoded list to be zero.\ + +definition e_hd :: "nat \ nat" where + "e_hd e \ if e = 0 then 0 else hd (list_decode e)" + +lemma e_hd [simp]: + assumes "list_decode e = x # xs" + shows "e_hd e = x" + using e_hd_def assms by auto + +lemma e_hd_0 [simp]: "e_hd 0 = 0" + using e_hd_def by simp + +lemma e_hd_neq_0 [simp]: + assumes "e \ 0" + shows "e_hd e = hd (list_decode e)" + using e_hd_def assms by simp + +definition "r_hd \ + Cn 1 r_ifz [Cn 1 r_pdec1 [r_dec], Cn 1 r_pdec2 [r_dec], Cn 1 r_pdec12 [r_dec]]" + +lemma r_hd_prim [simp]: "prim_recfn 1 r_hd" + unfolding r_hd_def by simp + +lemma r_hd [simp]: "eval r_hd [e] \= e_hd e" +proof - + have "e_hd e = (if pdec1 (e - 1) = 0 then pdec2 (e - 1) else pdec12 (e - 1))" + proof (cases e) + case 0 + then show ?thesis using pdec1_zero pdec2_le by auto + next + case (Suc d) + then show ?thesis by (cases "pdec1 d") (simp_all add: pdec1_zero) + qed + then show ?thesis unfolding r_hd_def by simp +qed + +abbreviation e_length :: "nat \ nat" where + "e_length e \ length (list_decode e)" + +lemma e_length_0: "e_length e = 0 \ e = 0" + by (metis list_encode.simps(1) length_0_conv list_encode_decode) + +definition "r_length \ Cn 1 r_ifz [Id 1 0, Z, Cn 1 S [Cn 1 r_pdec1 [r_dec]]]" + +lemma r_length_prim [simp]: "prim_recfn 1 r_length" + unfolding r_length_def by simp + +lemma r_length [simp]: "eval r_length [e] \= e_length e" + unfolding r_length_def by (cases e) simp_all + +text \Accessing an encoded list out of bounds yields zero.\ + +definition e_nth :: "nat \ nat \ nat" where + "e_nth e n \ if e = 0 then 0 else e_tuple_nth (pdec1 (e - 1)) (pdec2 (e - 1)) n" + +lemma e_nth [simp]: + "e_nth e n = (if n < e_length e then (list_decode e) ! 
n else 0)" + by (cases e) (simp_all add: e_nth_def e_tuple_nth_def) + +lemma e_hd_nth0: "e_hd e = e_nth e 0" + by (simp add: e_hd_def e_length_0 hd_conv_nth) + +definition "r_nth \ + Cn 2 r_ifz + [Id 2 0, + r_constn 1 0, + Cn 2 r_tuple_nth + [Cn 2 r_pdec1 [r_dummy 1 r_dec], Cn 2 r_pdec2 [r_dummy 1 r_dec], Id 2 1]]" + +lemma r_nth_prim [simp]: "prim_recfn 2 r_nth" + unfolding r_nth_def using r_tuple_nth_prim by simp + +lemma r_nth [simp]: "eval r_nth [e, n] \= e_nth e n" + unfolding r_nth_def e_nth_def using r_tuple_nth_prim by simp + +definition "r_rev_aux \ + Pr 1 r_hd (Cn 3 r_prod_encode [Cn 3 r_nth [Id 3 2, Cn 3 S [Id 3 0]], Id 3 1])" + +lemma r_rev_aux_prim: "prim_recfn 2 r_rev_aux" + unfolding r_rev_aux_def by simp + +lemma r_rev_aux: + assumes "list_decode e = xs" and "length xs > 0" and "i < length xs" + shows "eval r_rev_aux [i, e] \= tuple_encode i (rev (take (Suc i) xs))" + using assms(3) +proof (induction i) + case 0 + then show ?case + unfolding r_rev_aux_def using assms e_hd_def r_hd by (auto simp add: take_Suc) +next + case (Suc i) + let ?g = "Cn 3 r_prod_encode [Cn 3 r_nth [Id 3 2, Cn 3 S [Id 3 0]], Id 3 1]" + from Suc have "eval r_rev_aux [Suc i, e] = eval ?g [i, the (eval r_rev_aux [i, e]), e]" + unfolding r_rev_aux_def by simp + also have "... \= prod_encode (xs ! (Suc i), tuple_encode i (rev (take (Suc i) xs)))" + using Suc by (simp add: assms(1)) + finally show ?case by (simp add: Suc.prems take_Suc_conv_app_nth) +qed + +corollary r_rev_aux_full: + assumes "list_decode e = xs" and "length xs > 0" + shows "eval r_rev_aux [length xs - 1, e] \= tuple_encode (length xs - 1) (rev xs)" + using r_rev_aux assms by simp + +lemma r_rev_aux_total: "eval r_rev_aux [i, e] \" + using r_rev_aux_prim totalE by fastforce + +definition "r_rev \ + Cn 1 r_ifz + [Id 1 0, + Z, + Cn 1 S + [Cn 1 r_prod_encode + [Cn 1 r_dec [r_length], Cn 1 r_rev_aux [Cn 1 r_dec [r_length], Id 1 0]]]]" + +lemma r_rev_prim [simp]: "prim_recfn 1 r_rev" + unfolding r_rev_def using r_rev_aux_prim by simp + +lemma r_rev [simp]: "eval r_rev [e] \= list_encode (rev (list_decode e))" +proof - + let ?d = "Cn 1 r_dec [r_length]" + let ?a = "Cn 1 r_rev_aux [?d, Id 1 0]" + let ?p = "Cn 1 r_prod_encode [?d, ?a]" + let ?s = "Cn 1 S [?p]" + have eval_a: "eval ?a [e] = eval r_rev_aux [e_length e - 1, e]" + using r_rev_aux_prim by simp + then have "eval ?s [e] \" + using r_rev_aux_prim by (simp add: r_rev_aux_total) + then have *: "eval r_rev [e] \= (if e = 0 then 0 else the (eval ?s [e]))" + using r_rev_aux_prim by (simp add: r_rev_def) + show ?thesis + proof (cases "e = 0") + case True + then show ?thesis using * by simp + next + case False + then obtain xs where xs: "xs = list_decode e" "length xs > 0" + using e_length_0 by auto + then have len: "length xs = e_length e" by simp + with eval_a have "eval ?a [e] = eval r_rev_aux [length xs - 1, e]" + by simp + then have "eval ?a [e] \= tuple_encode (length xs - 1) (rev xs)" + using xs r_rev_aux_full by simp + then have "eval ?s [e] \= + Suc (prod_encode (length xs - 1, tuple_encode (length xs - 1) (rev xs)))" + using len r_rev_aux_prim by simp + then have "eval ?s [e] \= + Suc (prod_encode + (length (rev xs) - 1, tuple_encode (length (rev xs) - 1) (rev xs)))" + by simp + moreover have "length (rev xs) > 0" + using xs by simp + ultimately have "eval ?s [e] \= list_encode (rev xs)" + by (metis list_encode.elims diff_Suc_1 length_Cons length_greater_0_conv) + then show ?thesis using xs * by simp + qed +qed + +abbreviation e_cons :: "nat \ nat \ nat" where + "e_cons e es \ 
list_encode (e # list_decode es)" + +lemma e_cons_elementary: + "e_cons e es = + (if es = 0 then Suc (prod_encode (0, e)) + else Suc (prod_encode (e_length es, prod_encode (e, pdec2 (es - 1)))))" +proof (cases "es = 0") + case True + then show ?thesis by simp +next + case False + then have "e_length es = Suc (pdec1 (es - 1))" + by (metis list_decode.elims diff_Suc_1 tuple_decode_length) + moreover have "es = e_tl (list_encode (e # list_decode es))" + by (metis list.sel(3) list_decode_encode list_encode_decode) + ultimately show ?thesis + using False e_tl_elementary + by (metis list_decode.simps(2) diff_Suc_1 list_encode_decode prod.sel(1) + prod_encode_inverse snd_conv tuple_decode.simps(2)) +qed + +definition "r_cons_else \ + Cn 2 S + [Cn 2 r_prod_encode + [Cn 2 r_length + [Id 2 1], Cn 2 r_prod_encode [Id 2 0, Cn 2 r_pdec2 [Cn 2 r_dec [Id 2 1]]]]]" + +lemma r_cons_else_prim: "prim_recfn 2 r_cons_else" + unfolding r_cons_else_def by simp + +lemma r_cons_else: + "eval r_cons_else [e, es] \= + Suc (prod_encode (e_length es, prod_encode (e, pdec2 (es - 1))))" + unfolding r_cons_else_def by simp + +definition "r_cons \ + Cn 2 r_ifz + [Id 2 1, Cn 2 S [Cn 2 r_prod_encode [r_constn 1 0, Id 2 0]], r_cons_else]" + +lemma r_cons_prim [simp]: "prim_recfn 2 r_cons" + unfolding r_cons_def using r_cons_else_prim by simp + +lemma r_cons [simp]: "eval r_cons [e, es] \= e_cons e es" + unfolding r_cons_def using r_cons_else_prim r_cons_else e_cons_elementary by simp + +abbreviation e_snoc :: "nat \ nat \ nat" where + "e_snoc es e \ list_encode (list_decode es @ [e])" + +lemma e_nth_snoc_small [simp]: + assumes "n < e_length b" + shows "e_nth (e_snoc b z) n = e_nth b n" + using assms by (simp add: nth_append) + +lemma e_hd_snoc [simp]: + assumes "e_length b > 0" + shows "e_hd (e_snoc b x) = e_hd b" +proof - + from assms have "b \ 0" + using less_imp_neq by force + then have hd: "e_hd b = hd (list_decode b)" by simp + have "e_length (e_snoc b x) > 0" by simp + then have "e_snoc b x \ 0" + using not_gr_zero by fastforce + then have "e_hd (e_snoc b x) = hd (list_decode (e_snoc b x))" by simp + with assms hd show ?thesis by simp +qed + +definition "r_snoc \ Cn 2 r_rev [Cn 2 r_cons [Id 2 1, Cn 2 r_rev [Id 2 0]]]" + +lemma r_snoc_prim [simp]: "prim_recfn 2 r_snoc" + unfolding r_snoc_def by simp + +lemma r_snoc [simp]: "eval r_snoc [es, e] \= e_snoc es e" + unfolding r_snoc_def by simp + +abbreviation e_butlast :: "nat \ nat" where + "e_butlast e \ list_encode (butlast (list_decode e))" + +abbreviation e_take :: "nat \ nat \ nat" where + "e_take n x \ list_encode (take n (list_decode x))" + +definition "r_take \ + Cn 2 r_ifle + [Id 2 0, Cn 2 r_length [Id 2 1], + Pr 1 Z (Cn 3 r_snoc [Id 3 1, Cn 3 r_nth [Id 3 2, Id 3 0]]), + Id 2 1]" + +lemma r_take_prim [simp]: "prim_recfn 2 r_take" + unfolding r_take_def by simp_all + +lemma r_take: + assumes "x = list_encode es" + shows "eval r_take [n, x] \= list_encode (take n es)" +proof - + let ?g = "Cn 3 r_snoc [Id 3 1, Cn 3 r_nth [Id 3 2, Id 3 0]]" + let ?h = "Pr 1 Z ?g" + have "total ?h" using Mn_free_imp_total by simp + have "m \ length es \ eval ?h [m, x] \= list_encode (take m es)" for m + proof (induction m) + case 0 + then show ?case using assms r_take_def by (simp add: r_take_def) + next + case (Suc m) + then have "m < length es" by simp + then have "eval ?h [Suc m, x] = eval ?g [m, the (eval ?h [m, x]), x]" + using Suc r_take_def by simp + also have "... = eval ?g [m, list_encode (take m es), x]" + using Suc by simp + also have "... 
\= e_snoc (list_encode (take m es)) (es ! m)" + by (simp add: \m < length es\ assms) + also have "... \= list_encode ((take m es) @ [es ! m])" + using list_decode_encode by simp + also have "... \= list_encode (take (Suc m) es)" + by (simp add: \m < length es\ take_Suc_conv_app_nth) + finally show ?case . + qed + moreover have "eval (Id 2 1) [m, x] \= list_encode (take m es)" if "m > length es" for m + using that assms by simp + moreover have "eval r_take [m, x] \= + (if m \ e_length x then the (eval ?h [m, x]) else the (eval (Id 2 1) [m, x]))" + for m + unfolding r_take_def using `total ?h` by simp + ultimately show ?thesis unfolding r_take_def by fastforce +qed + +corollary r_take' [simp]: "eval r_take [n, x] \= e_take n x" + by (simp add: r_take) + +definition "r_last \ Cn 1 r_hd [r_rev]" + +lemma r_last_prim [simp]: "prim_recfn 1 r_last" + unfolding r_last_def by simp + +lemma r_last [simp]: + assumes "e = list_encode xs" and "length xs > 0" + shows "eval r_last [e] \= last xs" +proof - + from assms(2) have "length (rev xs) > 0" by simp + then have "list_encode (rev xs) > 0" + by (metis gr0I list.size(3) list_encode_0) + moreover have "eval r_last [e] = eval r_hd [the (eval r_rev [e])]" + unfolding r_last_def by simp + ultimately show ?thesis using assms hd_rev by auto +qed + +definition "r_update_aux \ + let + f = r_constn 2 0; + g = Cn 5 r_snoc + [Id 5 1, Cn 5 r_ifeq [Id 5 0, Id 5 3, Id 5 4, Cn 5 r_nth [Id 5 2, Id 5 0]]] + in Pr 3 f g" + +lemma r_update_aux_recfn: "recfn 4 r_update_aux" + unfolding r_update_aux_def by simp + +lemma r_update_aux: + assumes "n \ e_length b" + shows "eval r_update_aux [n, b, j, v] \= list_encode ((take n (list_decode b))[j:=v])" + using assms +proof (induction n) + case 0 + then show ?case unfolding r_update_aux_def by simp +next + case (Suc n) + then have n: "n < e_length b" + by simp + let ?a = "Cn 5 r_nth [Id 5 2, Id 5 0]" + let ?b = "Cn 5 r_ifeq [Id 5 0, Id 5 3, Id 5 4, ?a]" + define g where "g \ Cn 5 r_snoc [Id 5 1, ?b]" + then have g: "eval g [n, r, b, j, v] \= e_snoc r (if n = j then v else e_nth b n)" for r + by simp + + have "Pr 3 (r_constn 2 0) g = r_update_aux" + using r_update_aux_def g_def by simp + then have "eval r_update_aux [Suc n, b, j, v] = + eval g [n, the (eval r_update_aux [n, b, j, v]), b, j, v]" + using r_update_aux_recfn Suc n eval_Pr_converg_Suc + by (metis arity.simps(5) length_Cons list.size(3) nat_less_le + numeral_3_eq_3 option.simps(3)) + then have *: "eval r_update_aux [Suc n, b, j, v] \= e_snoc + (list_encode ((take n (list_decode b))[j:=v])) + (if n = j then v else e_nth b n)" + using g Suc by simp + + consider (j_eq_n) "j = n" | (j_less_n) "j < n" | (j_gt_n) "j > n" + by linarith + then show ?case + proof (cases) + case j_eq_n + moreover from this have "(take (Suc n) (list_decode b))[j:=v] = + (take n (list_decode b))[j:=v] @ [v]" + using n + by (metis length_list_update nth_list_update_eq take_Suc_conv_app_nth take_update_swap) + ultimately show ?thesis using * by simp + next + case j_less_n + moreover from this have "(take (Suc n) (list_decode b))[j:=v] = + (take n (list_decode b))[j:=v] @ [(list_decode b) ! n]" + using n + by (simp add: le_eq_less_or_eq list_update_append min_absorb2 take_Suc_conv_app_nth) + ultimately show ?thesis using * by auto + next + case j_gt_n + moreover from this have "(take (Suc n) (list_decode b))[j:=v] = + (take n (list_decode b))[j:=v] @ [(list_decode b) ! 
n]" + using n take_Suc_conv_app_nth by auto + ultimately show ?thesis using * by auto + qed +qed + +abbreviation e_update :: "nat \ nat \ nat \ nat" where + "e_update b j v \ list_encode ((list_decode b)[j:=v])" + +definition "r_update \ + Cn 3 r_update_aux [Cn 3 r_length [Id 3 0], Id 3 0, Id 3 1, Id 3 2]" + +lemma r_update_recfn [simp]: "recfn 3 r_update" + unfolding r_update_def using r_update_aux_recfn by simp + +lemma r_update [simp]: "eval r_update [b, j, v] \= e_update b j v" + unfolding r_update_def using r_update_aux r_update_aux_recfn by simp + +lemma e_length_update [simp]: "e_length (e_update b k v) = e_length b" + by simp + +definition e_append :: "nat \ nat \ nat" where + "e_append xs ys \ list_encode (list_decode xs @ list_decode ys)" + +lemma e_length_append: "e_length (e_append xs ys) = e_length xs + e_length ys" + using e_append_def by simp + +lemma e_nth_append_small: + assumes "n < e_length xs" + shows "e_nth (e_append xs ys) n = e_nth xs n" + using e_append_def assms by (simp add: nth_append) + +lemma e_nth_append_big: + assumes "n \ e_length xs" + shows "e_nth (e_append xs ys) n = e_nth ys (n - e_length xs)" + using e_append_def assms e_nth by (simp add: less_diff_conv2 nth_append) + +definition "r_append \ + let + f = Id 2 0; + g = Cn 4 r_snoc [Id 4 1, Cn 4 r_nth [Id 4 3, Id 4 0]] + in Cn 2 (Pr 2 f g) [Cn 2 r_length [Id 2 1], Id 2 0, Id 2 1]" + +lemma r_append_prim [simp]: "prim_recfn 2 r_append" + unfolding r_append_def by simp + +lemma r_append [simp]: "eval r_append [a, b] \= e_append a b" +proof - + define g where "g = Cn 4 r_snoc [Id 4 1, Cn 4 r_nth [Id 4 3, Id 4 0]]" + then have g: "eval g [j, r, a, b] \= e_snoc r (e_nth b j)" for j r + by simp + let ?h = "Pr 2 (Id 2 0) g" + have "eval ?h [n, a, b] \= list_encode (list_decode a @ (take n (list_decode b)))" + if "n \ e_length b" for n + using that g g_def by (induction n) (simp_all add: take_Suc_conv_app_nth) + then show ?thesis + unfolding r_append_def g_def e_append_def by simp +qed + +definition e_append_zeros :: "nat \ nat \ nat" where + "e_append_zeros b z \ e_append b (list_encode (replicate z 0))" + +lemma e_append_zeros_length: "e_length (e_append_zeros b z) = e_length b + z" + using e_append_def e_append_zeros_def by simp + +lemma e_nth_append_zeros: "e_nth (e_append_zeros b z) i = e_nth b i" + using e_append_zeros_def e_nth_append_small e_nth_append_big by auto + +lemma e_nth_append_zeros_big: + assumes "i \ e_length b" + shows "e_nth (e_append_zeros b z) i = 0" + unfolding e_append_zeros_def + using e_nth_append_big[of b i "list_encode (replicate z 0)", OF assms(1)] + by simp + +definition "r_append_zeros \ + r_swap (Pr 1 (Id 1 0) (Cn 3 r_snoc [Id 3 1, r_constn 2 0]))" + +lemma r_append_zeros_prim [simp]: "prim_recfn 2 r_append_zeros" + unfolding r_append_zeros_def by simp + +lemma r_append_zeros: "eval r_append_zeros [b, z] \= e_append_zeros b z" +proof - + let ?r = "Pr 1 (Id 1 0) (Cn 3 r_snoc [Id 3 1, r_constn 2 0])" + have "eval ?r [z, b] \= e_append_zeros b z" + using e_append_zeros_def e_append_def + by (induction z) (simp_all add: replicate_append_same) + then show ?thesis by (simp add: r_append_zeros_def) +qed + +end \ No newline at end of file diff --git a/thys/Inductive_Inference/R1_BC.thy b/thys/Inductive_Inference/R1_BC.thy new file mode 100644 --- /dev/null +++ b/thys/Inductive_Inference/R1_BC.thy @@ -0,0 +1,534 @@ +section \@{term "\"} is not in BC\label{s:r1_bc}\ + +theory R1_BC + imports Lemma_R + CP_FIN_NUM (* for V0 *) +begin + +text \We show that @{term "U\<^sub>0 \ V\<^sub>0"} is not 
in BC, +which implies @{term "\ \ BC"}. + +The proof is by contradiction. Assume there is a strategy $S$ learning @{term +"U\<^sub>0 \ V\<^sub>0"} behaviorally correct in the limit with respect to our +standard Gödel numbering $\varphi$. Thanks to Lemma~R for BC we can assume +$S$ to be total. Then we construct a function in @{term "U\<^sub>0 \ V\<^sub>0"} for +which $S$ fails. + +As usual, there is a computable process building prefixes of functions +$\psi_j$. For every $j$ it starts with the singleton prefix $b = [j]$ and +computes the next prefix from a given prefix $b$ as follows: + +\begin{enumerate} +\item Simulate $\varphi_{S(b0^k)}(|b| + k)$ for increasing $k$ for an + increasing number of steps. +\item Once a $k$ with $\varphi_{S(b0^k)}(|b| + k) = 0$ is found, extend the + prefix by $0^k1$. +\end{enumerate} + +There is always such a $k$ because by assumption $S$ learns $b0^\infty \in +U_0$ and thus outputs a hypothesis for $b0^\infty$ on almost all of its +prefixes. Therefore for almost all prefixes of the form $b0^k$, we have +$\varphi_{S(b0^k)} = b0^\infty$ and hence $\varphi_{S(b0^k)}(|b| + k) = 0$. +But Step~2 constructs $\psi_j$ such that $\psi_j(|b| + k) = 1$. Therefore $S$ +does not hypothesize $\psi_j$ on the prefix $b0^k$ of $\psi_j$. And since the +process runs forever, $S$ outputs infinitely many incorrect hypotheses for +$\psi_j$ and thus does not learn $\psi_j$. + +Applying Kleene's fixed-point theorem to @{term "\ \ \\<^sup>2"} +yields a $j$ with $\varphi_j = \psi_j$ and thus $\psi_j \in V_0$. But $S$ +does not learn any $\psi_j$, contradicting our assumption. + +The result @{prop "\ \ BC"} can be obtained more directly by +running the process with the empty prefix, thereby constructing only one +function instead of a numbering. This function is in @{term R1}, and $S$ +fails to learn it by the same reasoning as above. The stronger statement +about @{term "U\<^sub>0 \ V\<^sub>0"} will be exploited in +Section~\ref{s:union}. + +In the following locale the assumption that $S$ learns @{term "U\<^sub>0"} +suffices for analyzing the process. However, in order to arrive at the +desired contradiction this assumption is too weak because the functions built +by the process are not in @{term "U\<^sub>0"}.\ + +locale r1_bc = + fixes s :: partial1 + assumes s_in_R1: "s \ \" and s_learn_U0: "learn_bc \ U\<^sub>0 s" +begin + +lemma s_learn_prenum: "\b. learn_bc \ {prenum b} s" + using s_learn_U0 U0_altdef learn_bc_closed_subseteq by blast + +text \A @{typ recf} for the strategy:\ + +definition r_s :: recf where + "r_s \ SOME rs. recfn 1 rs \ total rs \ s = (\x. eval rs [x])" + +lemma r_s_recfn [simp]: "recfn 1 r_s" + and r_s_total: "\x. eval r_s [x] \" + and eval_r_s: "\x. s x = eval r_s [x]" + using r_s_def R1_SOME[OF s_in_R1, of r_s] by simp_all + +text \We begin with the function that finds the $k$ from Step~1 of the +construction of $\psi$.\ + +definition "r_find_k \ + let k = Cn 2 r_pdec1 [Id 2 0]; + r = Cn 2 r_result1 + [Cn 2 r_pdec2 [Id 2 0], + Cn 2 r_s [Cn 2 r_append_zeros [Id 2 1, k]], + Cn 2 r_add [Cn 2 r_length [Id 2 1], k]] + in Cn 1 r_pdec1 [Mn 1 (Cn 2 r_eq [r, r_constn 1 1])]" + +lemma r_find_k_recfn [simp]: "recfn 1 r_find_k" + unfolding r_find_k_def by (simp add: Let_def) + +text \There is always a suitable $k$, since the strategy learns +$b0^\infty$ for all $b$.\ + +lemma learn_bc_prenum_eventually_zero: + "\k. \ (the (s (e_append_zeros b k))) (e_length b + k) \= 0" +proof - + let ?f = "prenum b" + have "\n\e_length b. 
\ (the (s (?f \ n))) = ?f" + using learn_bcE s_learn_prenum by (meson le_cases singletonI) + then obtain n where n: "n \ e_length b" "\ (the (s (?f \ n))) = ?f" + by auto + define k where "k = Suc n - e_length b" + let ?e = "e_append_zeros b k" + have len: "e_length ?e = Suc n" + using k_def n e_append_zeros_length by simp + have "?f \ n = ?e" + proof - + have "e_length ?e > 0" + using len n(1) by simp + moreover have "?f x \= e_nth ?e x" for x + proof (cases "x < e_length b") + case True + then show ?thesis using e_nth_append_zeros by simp + next + case False + then have "?f x \= 0" by simp + moreover from False have "e_nth ?e x = 0" + using e_nth_append_zeros_big by simp + ultimately show ?thesis by simp + qed + ultimately show ?thesis using initI[of "?e"] len by simp + qed + with n(2) have "\ (the (s ?e)) = ?f" by simp + then have "\ (the (s ?e)) (e_length ?e) \= 0" + using len n(1) by auto + then show ?thesis using e_append_zeros_length by auto +qed + +lemma if_eq_eq: "(if v = 1 then (0 :: nat) else 1) = 0 \ v = 1" + by presburger + +lemma r_find_k: + shows "eval r_find_k [b] \" + and "let k = the (eval r_find_k [b]) + in \ (the (s (e_append_zeros b k))) (e_length b + k) \= 0" +proof - + let ?k = "Cn 2 r_pdec1 [Id 2 0]" + let ?argt = "Cn 2 r_pdec2 [Id 2 0]" + let ?argi = "Cn 2 r_s [Cn 2 r_append_zeros [Id 2 1, ?k]]" + let ?argx = "Cn 2 r_add [Cn 2 r_length [Id 2 1], ?k]" + let ?r = "Cn 2 r_result1 [?argt, ?argi, ?argx]" + define f where "f \ + let k = Cn 2 r_pdec1 [Id 2 0]; + r = Cn 2 r_result1 + [Cn 2 r_pdec2 [Id 2 0], + Cn 2 r_s [Cn 2 r_append_zeros [Id 2 1, k]], + Cn 2 r_add [Cn 2 r_length [Id 2 1], k]] + in Cn 2 r_eq [r, r_constn 1 1]" + then have "recfn 2 f" by (simp add: Let_def) + have "total r_s" + by (simp add: r_s_total totalI1) + then have "total f" + unfolding f_def using Cn_total Mn_free_imp_total by (simp add: Let_def) + + have "eval ?argi [z, b] = s (e_append_zeros b (pdec1 z))" for z + using r_append_zeros \recfn 2 f\ eval_r_s by auto + then have "eval ?argi [z, b] \= the (s (e_append_zeros b (pdec1 z)))" for z + using eval_r_s r_s_total by simp + moreover have "recfn 2 ?r" using \recfn 2 f\ by auto + ultimately have r: "eval ?r [z, b] = + eval r_result1 [pdec2 z, the (s (e_append_zeros b (pdec1 z))), e_length b + pdec1 z]" + for z + by simp + then have f: "eval f [z, b] \= (if the (eval ?r [z, b]) = 1 then 0 else 1)" for z + using f_def `recfn 2 f` prim_recfn_total by (auto simp add: Let_def) + + have "\k. \ (the (s (e_append_zeros b k))) (e_length b + k) \= 0" + using s_learn_prenum learn_bc_prenum_eventually_zero by auto + then obtain k where "\ (the (s (e_append_zeros b k))) (e_length b + k) \= 0" + by auto + then obtain t where "eval r_result1 [t, the (s (e_append_zeros b k)), e_length b + k] \= Suc 0" + using r_result1_converg_phi(1) by blast + then have t: "eval r_result1 [t, the (s (e_append_zeros b k)), e_length b + k] \= Suc 0" + by simp + + let ?z = "prod_encode (k, t)" + have "eval ?r [?z, b] \= Suc 0" + using t r by (metis fst_conv prod_encode_inverse snd_conv) + with f have fzb: "eval f [?z, b] \= 0" by simp + moreover have "eval (Mn 1 f) [b] = + (if (\z. eval f ([z, b]) \= 0) + then Some (LEAST z. eval f [z, b] \= 0) + else None)" + using eval_Mn_total[of 1 f "[b]"] `total f` `recfn 2 f` by simp + ultimately have mn1f: "eval (Mn 1 f) [b] \= (LEAST z. eval f [z, b] \= 0)" + by auto + with fzb have "eval f [the (eval (Mn 1 f) [b]), b] \= 0" (is "eval f [?zz, b] \= 0") + using \total f\ \recfn 2 f\ LeastI_ex[of "%z. 
eval f [z, b] \= 0"] by auto + moreover have "eval f [?zz, b] \= (if the (eval ?r [?zz, b]) = 1 then 0 else 1)" + using f by simp + ultimately have "(if the (eval ?r [?zz, b]) = 1 then (0 :: nat) else 1) = 0" by auto + then have "the (eval ?r [?zz, b]) = 1" + using if_eq_eq[of "the (eval ?r [?zz, b])"] by simp + then have + "eval r_result1 + [pdec2 ?zz, the (s (e_append_zeros b (pdec1 ?zz))), e_length b + pdec1 ?zz] \= + 1" + using r r_result1_total r_result1_prim totalE + by (metis length_Cons list.size(3) numeral_3_eq_3 option.collapse) + then have *: "\ (the (s (e_append_zeros b (pdec1 ?zz)))) (e_length b + pdec1 ?zz) \= 0" + by (simp add: r_result1_some_phi) + + define Mn1f where "Mn1f = Mn 1 f" + then have "eval Mn1f [b] \= ?zz" + using mn1f by auto + moreover have "recfn 1 (Cn 1 r_pdec1 [Mn1f])" + using `recfn 2 f` Mn1f_def by simp + ultimately have "eval (Cn 1 r_pdec1 [Mn1f]) [b] = eval r_pdec1 [the (eval (Mn1f) [b])]" + by auto + then have "eval (Cn 1 r_pdec1 [Mn1f]) [b] = eval r_pdec1 [?zz]" + using Mn1f_def by blast + then have 1: "eval (Cn 1 r_pdec1 [Mn1f]) [b] \= pdec1 ?zz" + by simp + moreover have "recfn 1 (Cn 1 S [Cn 1 r_pdec1 [Mn1f]])" + using `recfn 2 f` Mn1f_def by simp + ultimately have "eval (Cn 1 S [Cn 1 r_pdec1 [Mn1f]]) [b] = + eval S [the (eval (Cn 1 r_pdec1 [Mn1f]) [b])]" + by simp + then have "eval (Cn 1 S [Cn 1 r_pdec1 [Mn1f]]) [b] = eval S [pdec1 ?zz]" + using 1 by simp + then have "eval (Cn 1 S [Cn 1 r_pdec1 [Mn1f]]) [b] \= Suc (pdec1 ?zz)" + by simp + moreover have "eval r_find_k [b] = eval (Cn 1 r_pdec1 [Mn1f]) [b]" + unfolding r_find_k_def Mn1f_def f_def by metis + ultimately have r_find_ksb: "eval r_find_k [b] \= pdec1 ?zz" + using 1 by simp + then show "eval r_find_k [b] \" by simp_all + + from r_find_ksb have "the (eval r_find_k [b]) = pdec1 ?zz" + by simp + moreover have "\ (the (s (e_append_zeros b (pdec1 ?zz)))) (e_length b + pdec1 ?zz) \= 0" + using * by simp + ultimately show "let k = the (eval r_find_k [b]) + in \ (the (s (e_append_zeros b k))) (e_length b + k) \= 0" + by simp +qed + +lemma r_find_k_total: "total r_find_k" + by (simp add: s_learn_prenum r_find_k(1) totalI1) + +text \The following function represents one iteration of the +process.\ + +abbreviation "r_next \ + Cn 3 r_snoc [Cn 3 r_append_zeros [Id 3 1, Cn 3 r_find_k [Id 3 1]], r_constn 2 1]" + +text \Using @{term r_next} we define the function @{term r_prefixes} +that computes the prefix after every iteration of the process.\ + +definition r_prefixes :: recf where + "r_prefixes \ Pr 1 r_singleton_encode r_next" + +lemma r_prefixes_recfn: "recfn 2 r_prefixes" + unfolding r_prefixes_def by simp + +lemma r_prefixes_total: "total r_prefixes" +proof - + have "recfn 3 r_next" by simp + then have "total r_next" + using `recfn 3 r_next` r_find_k_total Cn_total Mn_free_imp_total by auto + then show ?thesis + by (simp add: Mn_free_imp_total Pr_total r_prefixes_def) +qed + +lemma r_prefixes_0: "eval r_prefixes [0, j] \= list_encode [j]" + unfolding r_prefixes_def by simp + +lemma r_prefixes_Suc: + "eval r_prefixes [Suc n, j] \= + (let b = the (eval r_prefixes [n, j]) + in e_snoc (e_append_zeros b (the (eval r_find_k [b]))) 1)" +proof - + have "recfn 3 r_next" by simp + then have "total r_next" + using `recfn 3 r_next` r_find_k_total Cn_total Mn_free_imp_total by auto + have eval_next: "eval r_next [t, v, j] \= + e_snoc (e_append_zeros v (the (eval r_find_k [v]))) 1" + for t v j + using r_find_k_total `recfn 3 r_next` r_append_zeros by simp + then have "eval r_prefixes [Suc n, j] = eval r_next [n, 
the (eval r_prefixes [n, j]), j]" + using r_prefixes_total by (simp add: r_prefixes_def) + then show "eval r_prefixes [Suc n, j] \= + (let b = the (eval r_prefixes [n, j]) + in e_snoc (e_append_zeros b (the (eval r_find_k [b]))) 1)" + using eval_next by metis +qed + +text \Since @{term r_prefixes} is total, we can get away with +introducing a total function.\ + +definition prefixes :: "nat \ nat \ nat" where + "prefixes j t \ the (eval r_prefixes [t, j])" + +lemma prefixes_Suc: + "prefixes j (Suc t) = + e_snoc (e_append_zeros (prefixes j t) (the (eval r_find_k [prefixes j t]))) 1" + unfolding prefixes_def using r_prefixes_Suc by (simp_all add: Let_def) + +lemma prefixes_Suc_length: + "e_length (prefixes j (Suc t)) = + Suc (e_length (prefixes j t) + the (eval r_find_k [prefixes j t]))" + using e_append_zeros_length prefixes_Suc by simp + +lemma prefixes_length_mono: "e_length (prefixes j t) < e_length (prefixes j (Suc t))" + using prefixes_Suc_length by simp + +lemma prefixes_length_mono': "e_length (prefixes j t) \ e_length (prefixes j (t + d))" +proof (induction d) + case 0 + then show ?case by simp +next + case (Suc d) + then show ?case using prefixes_length_mono le_less_trans by fastforce +qed + +lemma prefixes_length_lower_bound: "e_length (prefixes j t) \ Suc t" +proof (induction t) + case 0 + then show ?case by (simp add: prefixes_def r_prefixes_0) +next + case (Suc t) + moreover have "Suc (e_length (prefixes j t)) \ e_length (prefixes j (Suc t))" + using prefixes_length_mono by (simp add: Suc_leI) + ultimately show ?case by simp +qed + +lemma prefixes_Suc_nth: + assumes "x < e_length (prefixes j t)" + shows "e_nth (prefixes j t) x = e_nth (prefixes j (Suc t)) x" +proof - + define k where "k = the (eval r_find_k [prefixes j t])" + let ?u = "e_append_zeros (prefixes j t) k" + have "prefixes j (Suc t) = + e_snoc (e_append_zeros (prefixes j t) (the (eval r_find_k [prefixes j t]))) 1" + using prefixes_Suc by simp + with k_def have "prefixes j (Suc t) = e_snoc ?u 1" + by simp + then have "e_nth (prefixes j (Suc t)) x = e_nth (e_snoc ?u 1) x" + by simp + moreover have "x < e_length ?u" + using assms e_append_zeros_length by auto + ultimately have "e_nth (prefixes j (Suc t)) x = e_nth ?u x" + using e_nth_snoc_small by simp + moreover have "e_nth ?u x = e_nth (prefixes j t) x" + using assms e_nth_append_zeros by simp + ultimately show "e_nth (prefixes j t) x = e_nth (prefixes j (Suc t)) x" + by simp +qed + +lemma prefixes_Suc_last: "e_nth (prefixes j (Suc t)) (e_length (prefixes j (Suc t)) - 1) = 1" + using prefixes_Suc by simp + +lemma prefixes_le_nth: + assumes "x < e_length (prefixes j t)" + shows "e_nth (prefixes j t) x = e_nth (prefixes j (t + d)) x" +proof (induction d) + case 0 + then show ?case by simp +next + case (Suc d) + have "x < e_length (prefixes j (t + d))" + using s_learn_prenum assms prefixes_length_mono' + by (simp add: less_eq_Suc_le order_trans_rules(23)) + then have "e_nth (prefixes j (t + d)) x = e_nth (prefixes j (t + Suc d)) x" + using prefixes_Suc_nth by simp + with Suc show ?case by simp +qed + +text \The numbering $\psi$ is defined via @{term[names_short] prefixes}.\ + +definition psi :: partial2 ("\") where + "\ j x \ Some (e_nth (prefixes j (Suc x)) x)" + +lemma psi_in_R2: "\ \ \\<^sup>2" +proof + define r where "r \ Cn 2 r_nth [Cn 2 r_prefixes [Cn 2 S [Id 2 1], Id 2 0], Id 2 1]" + then have "recfn 2 r" + using r_prefixes_recfn by simp + then have "eval r [j, x] \= e_nth (prefixes j (Suc x)) x" for j x + unfolding r_def prefixes_def using r_prefixes_total 
r_prefixes_recfn e_nth by simp + then have "eval r [j, x] = \ j x" for j x + unfolding psi_def by simp + then show "\ \ \
\<^sup>2" + using `recfn 2 r` by auto + show "total2 \" + unfolding psi_def by auto +qed + +lemma psi_eq_nth_prefixes: + assumes "x < e_length (prefixes j t)" + shows "\ j x \= e_nth (prefixes j t) x" +proof (cases "Suc x < t") + case True + have "x \ e_length (prefixes j x)" + using prefixes_length_lower_bound by (simp add: Suc_leD) + also have "... < e_length (prefixes j (Suc x))" + using prefixes_length_mono s_learn_prenum by simp + finally have "x < e_length (prefixes j (Suc x))" . + with True have "e_nth (prefixes j (Suc x)) x = e_nth (prefixes j t) x" + using prefixes_le_nth[of x j "Suc x" "t - Suc x"] by simp + then show ?thesis using psi_def by simp +next + case False + then have "e_nth (prefixes j (Suc x)) x = e_nth (prefixes j t) x" + using prefixes_le_nth[of x j t "Suc x - t"] assms by simp + then show ?thesis using psi_def by simp +qed + +lemma psi_at_0: "\ j 0 \= j" + using psi_eq_nth_prefixes[of 0 j 0] prefixes_length_lower_bound[of 0 j] + by (simp add: prefixes_def r_prefixes_0) + +text \The prefixes output by the process @{term[names_short] "prefixes j"} are +indeed prefixes of $\psi_j$.\ + +lemma prefixes_init_psi: "\ j \ (e_length (prefixes j (Suc t)) - 1) = prefixes j (Suc t)" +proof (rule initI[of "prefixes j (Suc t)"]) + let ?e = "prefixes j (Suc t)" + show "e_length ?e > 0" + using prefixes_length_lower_bound[of "Suc t" j] by auto + show "\x. x < e_length ?e \ \ j x \= e_nth ?e x" + using prefixes_Suc_nth psi_eq_nth_prefixes by simp +qed + +text \Every prefix of $\psi_j$ generated by the process +@{term[names_short] "prefixes j"} (except for the initial one) is of the form +$b0^k1$. But $k$ is chosen such that $\varphi_{S(b0^k)}(|b|+k) = 0 \neq 1 = +b0^k1_{|b|+k}$. Therefore the hypothesis $S(b0^k)$ is incorrect for +$\psi_j$.\ + +lemma hyp_wrong_at_last: + "\ (the (s (e_butlast (prefixes j (Suc t))))) (e_length (prefixes j (Suc t)) - 1) \ + \ j (e_length (prefixes j (Suc t)) - 1)" + (is "?lhs \ ?rhs") +proof - + let ?b = "prefixes j t" + let ?k = "the (eval r_find_k [?b])" + let ?x = "e_length (prefixes j (Suc t)) - 1" + have "e_butlast (prefixes j (Suc t)) = e_append_zeros ?b ?k" + using s_learn_prenum prefixes_Suc by simp + then have "?lhs = \ (the (s (e_append_zeros ?b ?k))) ?x" + by simp + moreover have "?x = e_length ?b + ?k" + using prefixes_Suc_length by simp + ultimately have "?lhs = \ (the (s (e_append_zeros ?b ?k))) (e_length ?b + ?k)" + by simp + then have "?lhs \= 0" + using r_find_k(2) r_s_total s_learn_prenum by metis + moreover have "?x < e_length (prefixes j (Suc t))" + using prefixes_length_lower_bound le_less_trans linorder_not_le s_learn_prenum + by fastforce + ultimately have "?rhs \= e_nth (prefixes j (Suc t)) ?x" + using psi_eq_nth_prefixes[of ?x j "Suc t"] by simp + moreover have "e_nth (prefixes j (Suc t)) ?x = 1" + using prefixes_Suc prefixes_Suc_last by simp + ultimately have "?rhs \= 1" by simp + with `?lhs \= 0` show ?thesis by simp +qed + +corollary hyp_wrong: "\ (the (s (e_butlast (prefixes j (Suc t))))) \ \ j" + using hyp_wrong_at_last[of j t] by auto + +text \For all $j$, the strategy $S$ outputs infinitely many wrong hypotheses for +$\psi_j$\ + +lemma infinite_hyp_wrong: "\m>n. 
\ (the (s (\ j \ m))) \ \ j" +proof - + let ?b = "prefixes j (Suc (Suc n))" + let ?bb = "e_butlast ?b" + have len_b: "e_length ?b > Suc (Suc n)" + using prefixes_length_lower_bound by (simp add: Suc_le_lessD) + then have len_bb: "e_length ?bb > Suc n" by simp + define m where "m = e_length ?bb - 1" + with len_bb have "m > n" by simp + have "\ j \ m = ?bb" + proof - + have "\ j \ (e_length ?b - 1) = ?b" + using prefixes_init_psi by simp + then have "\ j \ (e_length ?b - 2) = ?bb" + using init_butlast_init psi_in_R2 R2_proj_R1 R1_imp_total1 len_bb length_init + by (metis Suc_1 diff_diff_left length_butlast length_greater_0_conv + list.size(3) list_decode_encode not_less0 plus_1_eq_Suc) + then show ?thesis by (metis diff_Suc_1 length_init m_def) + qed + moreover have "\ (the (s ?bb)) \ \ j" + using hyp_wrong by simp + ultimately have "\ (the (s (\ j \ m))) \ \ j" + by simp + with `m > n` show ?thesis by auto +qed + +lemma U0_V0_not_learn_bc: "\ learn_bc \ (U\<^sub>0 \ V\<^sub>0) s" +proof - + obtain j where j: "\ j = \ j" + using R2_imp_P2 kleene_fixed_point psi_in_R2 by blast + moreover have "\m>n. \ (the (s ((\ j) \ m))) \ \ j" for n + using infinite_hyp_wrong[of _ j] by simp + ultimately have "\ learn_bc \ {\ j} s" + using infinite_hyp_wrong_not_BC by simp + moreover have "\ j \ V\<^sub>0" + proof - + have "\ j \ \" (is "?f \ \") + using psi_in_R2 by simp + moreover have "\ (the (?f 0)) = ?f" + using j psi_at_0[of j] by simp + ultimately show ?thesis by (simp add: V0_def) + qed + ultimately show "\ learn_bc \ (U\<^sub>0 \ V\<^sub>0) s" + using learn_bc_closed_subseteq by auto +qed + +end + +lemma U0_V0_not_in_BC: "U\<^sub>0 \ V\<^sub>0 \ BC" +proof + assume in_BC: "U\<^sub>0 \ V\<^sub>0 \ BC" + then have "U\<^sub>0 \ V\<^sub>0 \ BC_wrt \" + using BC_wrt_phi_eq_BC by simp + then obtain s where "learn_bc \ (U\<^sub>0 \ V\<^sub>0) s" + using BC_wrt_def by auto + then obtain s' where s': "s' \ \" "learn_bc \ (U\<^sub>0 \ V\<^sub>0) s'" + using lemma_R_for_BC_simple by blast + then have learn_U0: "learn_bc \ U\<^sub>0 s'" + using learn_bc_closed_subseteq[of \ "U\<^sub>0 \ V\<^sub>0" "s'"] by simp + then interpret r1_bc s' + by (simp add: r1_bc_def s'(1)) + have "\ learn_bc \ (U\<^sub>0 \ V\<^sub>0) s'" + using learn_bc_closed_subseteq U0_V0_not_learn_bc by simp + with s'(2) show False by simp +qed + +theorem R1_not_in_BC: "\ \ BC" +proof - + have "U\<^sub>0 \ V\<^sub>0 \ \" + using V0_def U0_in_NUM by auto + then show ?thesis + using U0_V0_not_in_BC BC_closed_subseteq by auto +qed + +end \ No newline at end of file diff --git a/thys/Inductive_Inference/ROOT b/thys/Inductive_Inference/ROOT new file mode 100644 --- /dev/null +++ b/thys/Inductive_Inference/ROOT @@ -0,0 +1,21 @@ +chapter AFP + +session Inductive_Inference (AFP) = HOL + + options [timeout = 600] + sessions + "HOL-Library" + theories + Partial_Recursive + Universal + Standard_Results + Inductive_Inference_Basics + CP_FIN_NUM + CONS_LIM + Lemma_R + LIM_BC + TOTAL_CONS + R1_BC + Union + document_files + "root.tex" + "root.bib" diff --git a/thys/Inductive_Inference/Standard_Results.thy b/thys/Inductive_Inference/Standard_Results.thy new file mode 100644 --- /dev/null +++ b/thys/Inductive_Inference/Standard_Results.thy @@ -0,0 +1,1594 @@ +theory Standard_Results + imports Universal +begin + +section \Kleene normal form and the number of $\mu$-operations\ + +text \Kleene's original normal form theorem~\cite{Kleene43} states that +every partial recursive $f$ can be expressed as $f(x) = u(\mu y[t(i, x, y) = +0]$ for some $i$, where $u$ and 
$t$ are specially crafted primitive recursive +functions tied to Kleene's definition of partial recursive functions. +Rogers~\cite[p.~29f.]{Rogers87} relaxes the theorem by allowing $u$ and $t$ +to be any primitive recursive functions of arity one and three, respectively. +Both versions require a separate $t$-predicate for every arity. We will show +a unified version for all arities by treating $x$ as an encoded list of +arguments. + +Our universal function @{thm[display,names_short] "r_univ_def"} can represent +all partial recursive functions (see theorem @{thm[source] r_univ}). Moreover +@{term "r_result"}, @{term "r_dec"}, and @{term "r_not"} are primitive +recursive. As such @{term r_univ} could almost serve as the right-hand side +$u(\mu y[t(i, x, y) = 0]$. Its only flaw is that the outer function, the +composition of @{term r_dec} and @{term r_result}, is ternary rather than +unary.\ + +lemma r_univ_almost_kleene_nf: + "r_univ \ + (let u = Cn 3 r_dec [r_result]; + t = Cn 3 r_not [r_result] + in Cn 2 u [Mn 2 t, Id 2 0, Id 2 1])" + unfolding r_univ_def by (rule exteqI) simp_all + +text \We can remedy the wrong arity with some encoding and +projecting.\ + +definition r_nf_t :: recf where + "r_nf_t \ Cn 3 r_and + [Cn 3 r_eq [Cn 3 r_pdec2 [Id 3 0], Cn 3 r_prod_encode [Id 3 1, Id 3 2]], + Cn 3 r_not + [Cn 3 r_result + [Cn 3 r_pdec1 [Id 3 0], + Cn 3 r_pdec12 [Id 3 0], + Cn 3 r_pdec22 [Id 3 0]]]]" + +lemma r_nf_t_prim: "prim_recfn 3 r_nf_t" + unfolding r_nf_t_def by simp + +definition r_nf_u :: recf where + "r_nf_u \ Cn 1 r_dec [Cn 1 r_result [r_pdec1, r_pdec12, r_pdec22]]" + +lemma r_nf_u_prim: "prim_recfn 1 r_nf_u" + unfolding r_nf_u_def by simp + +lemma r_nf_t_0: + assumes "eval r_result [pdec1 y, pdec12 y, pdec22 y] \\ 0" + and "pdec2 y = prod_encode (i, x)" + shows "eval r_nf_t [y, i, x] \= 0" + unfolding r_nf_t_def using assms by auto + +lemma r_nf_t_1: + assumes "eval r_result [pdec1 y, pdec12 y, pdec22 y] \= 0 \ pdec2 y \ prod_encode (i, x)" + shows "eval r_nf_t [y, i, x] \= 1" + unfolding r_nf_t_def using assms r_result_total by auto + +text \The next function is just as universal as @{term r_univ}, but +satisfies the conditions of the Kleene normal form theorem because the +outer funtion @{term r_nf_u} is unary.\ + +definition "r_normal_form \ Cn 2 r_nf_u [Mn 2 r_nf_t]" + +lemma r_normal_form_recfn: "recfn 2 r_normal_form" + unfolding r_normal_form_def using r_nf_u_prim r_nf_t_prim by simp + +lemma r_univ_exteq_r_normal_form: "r_univ \ r_normal_form" +proof (rule exteqI) + show arity: "arity r_univ = arity r_normal_form" + using r_normal_form_recfn by simp + show "eval r_univ xs = eval r_normal_form xs" if "length xs = arity r_univ" for xs + proof - + have "length xs = 2" + using that by simp + then obtain i x where ix: "[i, x] = xs" + by (metis length_0_conv length_Suc_conv numeral_2_eq_2) + have "eval r_univ [i, x] = eval r_normal_form [i, x]" + proof (cases "\t. eval r_result [t, i, x] \= 0") + case True + then have "eval r_univ [i, x] \" + unfolding r_univ_def by simp + moreover have "eval r_normal_form [i, x] \" + proof - + have "eval r_nf_t [y, i, x] \= 1" for y + using True r_nf_t_1[of y i x] by fastforce + then show ?thesis + unfolding r_normal_form_def using r_nf_u_prim r_nf_t_prim by simp + qed + ultimately show ?thesis by simp + next + case False + then have "\t. 
eval r_result [t, i, x] \\ 0" + by (simp add: r_result_total) + then obtain t where "eval r_result [t, i, x] \\ 0" + by auto + then have "eval r_nf_t [triple_encode t i x, i, x] \= 0" + using r_nf_t_0 by simp + then obtain y where y: "eval (Mn 2 r_nf_t) [i, x] \= y" + using r_nf_t_prim Mn_free_imp_total by fastforce + then have "eval r_nf_t [y, i, x] \= 0" + using r_nf_t_prim Mn_free_imp_total eval_Mn_convergE(2)[of 2 r_nf_t "[i, x]" y] + by simp + then have r_result: "eval r_result [pdec1 y, pdec12 y, pdec22 y] \\ 0" + and pdec2: "pdec2 y = prod_encode (i, x)" + using r_nf_t_0[of y i x] r_nf_t_1[of y i x] r_result_total by auto + then have "eval r_result [pdec1 y, i, x] \\ 0" + by simp + then obtain v where v: + "eval r_univ [pdec12 y, pdec22 y] \= v" + "eval r_result [pdec1 y, pdec12 y, pdec22 y] \= Suc v" + using r_result r_result_bivalent'[of "pdec12 y" "pdec22 y" _ "pdec1 y"] + r_result_diverg'[of "pdec12 y" "pdec22 y" "pdec1 y"] + by auto + + have "eval r_normal_form [i, x] = eval r_nf_u [y]" + unfolding r_normal_form_def using y r_nf_t_prim r_nf_u_prim by simp + also have "... = eval r_dec [the (eval (Cn 1 r_result [r_pdec1, r_pdec12, r_pdec22]) [y])]" + unfolding r_nf_u_def using r_result by simp + also have "... = eval r_dec [Suc v]" + using v by simp + also have "... \= v" + by simp + finally have "eval r_normal_form [i, x] \= v" . + moreover have "eval r_univ [i, x] \= v" + using v(1) pdec2 by simp + ultimately show ?thesis by simp + qed + with ix show ?thesis by simp + qed +qed + +theorem normal_form: + assumes "recfn n f" + obtains i where "\x. e_length x = n \ eval r_normal_form [i, x] = eval f (list_decode x)" +proof - + have "eval r_normal_form [encode f, x] = eval f (list_decode x)" if "e_length x = n" for x + using r_univ_exteq_r_normal_form assms that exteq_def r_univ' by auto + then show ?thesis using that by auto +qed + +text \As a consequence of the normal form theorem every partial +recursive function can be represented with exactly one application of the +$\mu$-operator.\ + +fun count_Mn :: "recf \ nat" where + "count_Mn Z = 0" +| "count_Mn S = 0" +| "count_Mn (Id m n) = 0" +| "count_Mn (Cn n f gs) = count_Mn f + sum_list (map count_Mn gs)" +| "count_Mn (Pr n f g) = count_Mn f + count_Mn g" +| "count_Mn (Mn n f) = Suc (count_Mn f)" + +lemma count_Mn_zero_iff_prim: "count_Mn f = 0 \ Mn_free f" + by (induction f) auto + +text \The normal form has only one $\mu$-recursion.\ + +lemma count_Mn_normal_form: "count_Mn r_normal_form = 1" + unfolding r_normal_form_def r_nf_u_def r_nf_t_def using count_Mn_zero_iff_prim by simp + +lemma one_Mn_suffices: + assumes "recfn n f" + shows "\g. count_Mn g = 1 \ g \ f" +proof - + have "n > 0" + using assms wellf_arity_nonzero by auto + obtain i where i: + "\x. 
e_length x = n \ eval r_normal_form [i, x] = eval f (list_decode x)" + using normal_form[OF assms(1)] by auto + define g where "g \ Cn n r_normal_form [r_constn (n - 1) i, r_list_encode (n - 1)]" + then have "recfn n g" + using r_normal_form_recfn `n > 0` by simp + then have "g \ f" + using g_def r_list_encode i assms by (intro exteqI) simp_all + moreover have "count_Mn g = 1" + unfolding g_def using count_Mn_normal_form count_Mn_zero_iff_prim by simp + ultimately show ?thesis by auto +qed + +text \The previous lemma could have been obtained without @{term +"r_normal_form"} directly from @{term "r_univ"}.\ + + +section \The $s$-$m$-$n$ theorem\ + +text \For all $m, n > 0$ there is an $(m + 1)$-ary primitive recursive +function $s^m_n$ with +\[ + \varphi_p^{(m + n)}(c_1, \dots,c_m, x_1, \dots, x_n) = + \varphi_{s^m_n(p, c_1, \dots,c_m)}^{(n)}(x_1, \dots, x_n) +\] +for all $p, c_1, \ldots, c_m, x_1, \ldots, x_n$. Here, $\varphi^{(n)}$ is a +function universal for $n$-ary partial recursive functions, which we will +represent by @{term "r_universal n"}\ + +text \The $s^m_n$ functions compute codes of functions. We start simple: +computing codes of the unary constant functions.\ + +fun code_const1 :: "nat \ nat" where + "code_const1 0 = 0" +| "code_const1 (Suc c) = quad_encode 3 1 1 (singleton_encode (code_const1 c))" + +lemma code_const1: "code_const1 c = encode (r_const c)" + by (induction c) simp_all + +definition "r_code_const1_aux \ + Cn 3 r_prod_encode + [r_constn 2 3, + Cn 3 r_prod_encode + [r_constn 2 1, + Cn 3 r_prod_encode + [r_constn 2 1, Cn 3 r_singleton_encode [Id 3 1]]]]" + +lemma r_code_const1_aux_prim: "prim_recfn 3 r_code_const1_aux" + by (simp_all add: r_code_const1_aux_def) + +lemma r_code_const1_aux: + "eval r_code_const1_aux [i, r, c] \= quad_encode 3 1 1 (singleton_encode r)" + by (simp add: r_code_const1_aux_def) + +definition "r_code_const1 \ r_shrink (Pr 1 Z r_code_const1_aux)" + +lemma r_code_const1_prim: "prim_recfn 1 r_code_const1" + by (simp_all add: r_code_const1_def r_code_const1_aux_prim) + +lemma r_code_const1: "eval r_code_const1 [c] \= code_const1 c" +proof - + let ?h = "Pr 1 Z r_code_const1_aux" + have "eval ?h [c, x] \= code_const1 c" for x + using r_code_const1_aux r_code_const1_def + by (induction c) (simp_all add: r_code_const1_aux_prim) + then show ?thesis by (simp add: r_code_const1_def r_code_const1_aux_prim) +qed + +text \Functions that compute codes of higher-arity constant functions:\ + +definition code_constn :: "nat \ nat \ nat" where + "code_constn n c \ + if n = 1 then code_const1 c + else quad_encode 3 n (code_const1 c) (singleton_encode (triple_encode 2 n 0))" + +lemma code_constn: "code_constn (Suc n) c = encode (r_constn n c)" + unfolding code_constn_def using code_const1 r_constn_def + by (cases "n = 0") simp_all + +definition r_code_constn :: "nat \ recf" where + "r_code_constn n \ + if n = 1 then r_code_const1 + else + Cn 1 r_prod_encode + [r_const 3, + Cn 1 r_prod_encode + [r_const n, + Cn 1 r_prod_encode + [r_code_const1, + Cn 1 r_singleton_encode + [Cn 1 r_prod_encode + [r_const 2, Cn 1 r_prod_encode [r_const n, Z]]]]]]" + +lemma r_code_constn_prim: "prim_recfn 1 (r_code_constn n)" + by (simp_all add: r_code_constn_def r_code_const1_prim) + +lemma r_code_constn: "eval (r_code_constn n) [c] \= code_constn n c" + by (auto simp add: r_code_constn_def r_code_const1 code_constn_def r_code_const1_prim) + +text \Computing codes of $m$-ary projections:\ + +definition code_id :: "nat \ nat \ nat" where + "code_id m n \ triple_encode 2 m n" + 
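+text \As an aside, an illustrative special case (not needed for the formal
+development): for $m = n = 1$ the defining property of $s^m_n$ specializes to
+\[
+  \varphi_p^{(2)}(c, x) = \varphi_{s^1_1(p, c)}^{(1)}(x),
+\]
+that is, fixing the first argument $c$ of the binary function with index $p$
+yields a unary function whose index $s^1_1(p, c)$ depends primitive recursively
+on $p$ and $c$. The functions @{term code_constn} and @{term code_id} defined
+above provide the codes of the constant and projection functions from which
+such an index is assembled next.\
+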
+lemma code_id: "encode (Id m n) = code_id m n" + unfolding code_id_def by simp + +text \The functions $s^m_n$ are represented by the following function. +The value $m$ corresponds to the length of @{term "cs"}.\ + +definition smn :: "nat \ nat \ nat list \ nat" where + "smn n p cs \ quad_encode + 3 + n + (encode (r_universal (n + length cs))) + (list_encode (code_constn n p # map (code_constn n) cs @ map (code_id n) [0.. 0" + shows "smn n p cs = encode + (Cn n + (r_universal (n + length cs)) + (r_constn (n - 1) p # map (r_constn (n - 1)) cs @ (map (Id n) [0..The next function is to help us define @{typ recf}s corresponding +to the $s^m_n$ functions. It maps $m + 1$ arguments $p, c_1, \ldots, c_m$ to +an encoded list of length $m + n + 1$. The list comprises the $m + 1$ codes +of the $n$-ary constants $p, c_1, \ldots, c_m$ and the $n$ codes for all +$n$-ary projections.\ + +definition r_smn_aux :: "nat \ nat \ recf" where + "r_smn_aux n m \ + Cn (Suc m) + (r_list_encode (m + n)) + (map (\i. Cn (Suc m) (r_code_constn n) [Id (Suc m) i]) [0..i. r_constn m (code_id n i)) [0.. 0 \ prim_recfn (Suc m) (r_smn_aux n m)" + by (auto simp add: r_smn_aux_def r_code_constn_prim) + +lemma r_smn_aux: + assumes "n > 0" and "length cs = m" + shows "eval (r_smn_aux n m) (p # cs) \= + list_encode (map (code_constn n) (p # cs) @ map (code_id n) [0..g. eval g (p # cs)) ?xs = map Some (map (code_constn n) (p # cs))" + proof (intro nth_equalityI) + show len: "length (map (\g. eval g (p # cs)) ?xs) = + length (map Some (map (code_constn n) (p # cs)))" + by (simp add: assms(2)) + + have "map (\g. eval g (p # cs)) ?xs ! i = map Some (map (code_constn n) (p # cs)) ! i" + if "i < Suc m" for i + proof - + have "map (\g. eval g (p # cs)) ?xs ! i = (\g. eval g (p # cs)) (?xs ! i)" + using len_xs that by (metis nth_map) + also have "... = eval (Cn (Suc m) (r_code_constn n) [Id (Suc m) i]) (p # cs)" + using that len_xs + by (metis (no_types, lifting) add.left_neutral length_map nth_map nth_upt) + also have "... = eval (r_code_constn n) [the (eval (Id (Suc m) i) (p # cs))]" + using r_code_constn_prim assms(2) that by simp + also have "... = eval (r_code_constn n) [(p # cs) ! i]" + using len that by simp + finally have "map (\g. eval g (p # cs)) ?xs ! i \= code_constn n ((p # cs) ! i)" + using r_code_constn by simp + then show ?thesis + using len_xs len that by (metis length_map nth_map) + qed + moreover have "length (map (\g. eval g (p # cs)) ?xs) = Suc m" by simp + ultimately show "\i. i < length (map (\g. eval g (p # cs)) ?xs) \ + map (\g. eval g (p # cs)) ?xs ! i = + map Some (map (code_constn n) (p # cs)) ! i" + by simp + qed + moreover have "map (\g. eval g (p # cs)) ?ys = map Some (map (code_id n) [0..g. eval g (p # cs)) (?xs @ ?ys) = + map Some (map (code_constn n) (p # cs) @ map (code_id n) [0..x. the (eval x (p # cs))) (?xs @ ?ys) = + map the (map (\x. eval x (p # cs)) (?xs @ ?ys))" + by simp + ultimately have *: "map (\g. the (eval g (p # cs))) (?xs @ ?ys) = + (map (code_constn n) (p # cs) @ map (code_id n) [0..ig. eval g (p # cs)) ?xs ! i" + by (metis nth_map) + then have + "\ii" + using assms map_xs by (metis length_map nth_map option.simps(3)) + then have xs_converg: "\z\set ?xs. eval z (p # cs) \" + by (metis in_set_conv_nth) + + have "\ix. eval x (p # cs)) ?ys ! i" + by simp + then have + "\ii" + by simp + then have "\z\set (?xs @ ?ys). 
eval z (p # cs) \" + using xs_converg by auto + moreover have "recfn (length (p # cs)) (Cn (Suc m) (r_list_encode (m + n)) (?xs @ ?ys))" + using assms r_code_constn_prim by auto + ultimately have "eval (r_smn_aux n m) (p # cs) = + eval (r_list_encode (m + n)) (map (\g. the (eval g (p # cs))) (?xs @ ?ys))" + unfolding r_smn_aux_def using assms by simp + then have "eval (r_smn_aux n m) (p # cs) = + eval (r_list_encode (m + n)) (map (code_constn n) (p # cs) @ map (code_id n) [0..For all $m, n > 0$, the @{typ recf} corresponding to $s^m_n$ is +given by the next function.\ + +definition r_smn :: "nat \ nat \ recf" where + "r_smn n m \ + Cn (Suc m) r_prod_encode + [r_constn m 3, + Cn (Suc m) r_prod_encode + [r_constn m n, + Cn (Suc m) r_prod_encode + [r_constn m (encode (r_universal (n + m))), r_smn_aux n m]]]" + +lemma r_smn_prim [simp]: "n > 0 \ prim_recfn (Suc m) (r_smn n m)" + by (simp_all add: r_smn_def r_smn_aux_prim) + +lemma r_smn: + assumes "n > 0" and "length cs = m" + shows "eval (r_smn n m) (p # cs) \= smn n p cs" + using assms r_smn_def r_smn_aux smn_def r_smn_aux_prim by simp + +lemma map_eval_Some_the: + assumes "map (\g. eval g xs) gs = map Some ys" + shows "map (\g. the (eval g xs)) gs = ys" + using assms + by (metis (no_types, lifting) length_map nth_equalityI nth_map option.sel) + +text \The essential part of the $s$-$m$-$n$ theorem: For all $m, n > 0$ +the function $s^m_n$ satisfies +\[ + \varphi_p^{(m + n)}(c_1, \dots,c_m, x_1, \dots, x_n) = + \varphi_{s^m_n(p, c_1, \dots,c_m)}^{(n)}(x_1, \dots, x_n) +\] for all $p, c_i, x_j$.\ + +lemma smn_lemma: + assumes "n > 0" and len_cs: "length cs = m" and len_xs: "length xs = n" + shows "eval (r_universal (m + n)) (p # cs @ xs) = + eval (r_universal n) ((the (eval (r_smn n m) (p # cs))) # xs)" +proof - + let ?s = "r_smn n m" + let ?f = "Cn n + (r_universal (n + length cs)) + (r_constn (n - 1) p # map (r_constn (n - 1)) cs @ (map (Id n) [0..= smn n p cs" + using assms r_smn by simp + then have eval_s: "eval ?s (p # cs) \= encode ?f" + by (simp add: assms(1) smn) + + have "recfn n ?f" + using len_cs assms by auto + then have *: "eval (r_universal n) ((encode ?f) # xs) = eval ?f xs" + using r_universal[of ?f n, OF _ len_xs] by simp + + let ?gs = "r_constn (n - 1) p # map (r_constn (n - 1)) cs @ map (Id n) [0..g\set ?gs. eval g xs \" + using len_cs len_xs assms by auto + then have "eval ?f xs = + eval (r_universal (n + length cs)) (map (\g. the (eval g xs)) ?gs)" + using len_cs len_xs assms `recfn n ?f` by simp + then have "eval ?f xs = eval (r_universal (m + n)) (map (\g. the (eval g xs)) ?gs)" + by (simp add: len_cs add.commute) + then have "eval (r_universal n) ((the (eval ?s (p # cs))) # xs) = + eval (r_universal (m + n)) (map (\g. the (eval g xs)) ?gs)" + using eval_s * by simp + moreover have "map (\g. the (eval g xs)) ?gs = p # cs @ xs" + proof (intro nth_equalityI) + show "length (map (\g. the (eval g xs)) ?gs) = length (p # cs @ xs)" + by (simp add: len_xs) + have len: "length (map (\g. the (eval g xs)) ?gs) = Suc (m + n)" + by (simp add: len_cs) + moreover have "map (\g. the (eval g xs)) ?gs ! i = (p # cs @ xs) ! i" + if "i < Suc (m + n)" for i + proof - + from that consider "i = 0" | "i > 0 \ i < Suc m" | "Suc m \ i \ i < Suc (m + n)" + using not_le_imp_less by auto + then show ?thesis + proof (cases) + case 1 + then show ?thesis using assms(1) len_xs by simp + next + case 2 + then have "?gs ! i = (map (r_constn (n - 1)) cs) ! 
(i - 1)" + using len_cs + by (metis One_nat_def Suc_less_eq Suc_pred length_map + less_numeral_extra(3) nth_Cons' nth_append) + then have "map (\g. the (eval g xs)) ?gs ! i = + (\g. the (eval g xs)) ((map (r_constn (n - 1)) cs) ! (i - 1))" + using len by (metis length_map nth_map that) + also have "... = the (eval ((r_constn (n - 1) (cs ! (i - 1)))) xs)" + using 2 len_cs by auto + also have "... = cs ! (i - 1)" + using r_constn len_xs assms(1) by simp + also have "... = (p # cs @ xs) ! i" + using 2 len_cs + by (metis diff_Suc_1 less_Suc_eq_0_disj less_numeral_extra(3) nth_Cons' nth_append) + finally show ?thesis . + next + case 3 + then have "?gs ! i = (map (Id n) [0..g. the (eval g xs)) ?gs ! i = + (\g. the (eval g xs)) ((map (Id n) [0..g. the (eval g xs)) ?gs ! i = (p # cs @ xs) ! i" + if "i < length (map (\g. the (eval g xs)) ?gs)" for i + using that by simp + qed + ultimately show ?thesis by simp +qed + +theorem smn_theorem: + assumes "n > 0" + shows "\s. prim_recfn (Suc m) s \ + (\p cs xs. length cs = m \ length xs = n \ + eval (r_universal (m + n)) (p # cs @ xs) = + eval (r_universal n) ((the (eval s (p # cs))) # xs))" + using smn_lemma exI[of _ "r_smn n m"] assms by simp + +text \For every numbering, that is, binary partial recursive function, +$\psi$ there is a total recursive function $c$ that translates $\psi$-indices +into $\varphi$-indices.\ + +lemma numbering_translation: + assumes "recfn 2 psi" + obtains c where + "recfn 1 c" + "total c" + "\i x. eval psi [i, x] = eval r_phi [the (eval c [i]), x]" +proof - + let ?p = "encode psi" + define c where "c = Cn 1 (r_smn 1 1) [r_const ?p, Id 1 0]" + then have "prim_recfn 1 c" by simp + moreover from this have "total c" + by auto + moreover have "eval r_phi [the (eval c [i]), x] = eval psi [i, x]" for i x + proof - + have "eval c [i] = eval (r_smn 1 1) [?p, i]" + using c_def by simp + then have "eval (r_universal 1) [the (eval c [i]), x] = + eval (r_universal 1) [the (eval (r_smn 1 1) [?p, i]), x]" + by simp + also have "... = eval (r_universal (1 + 1)) (?p # [i] @ [x])" + using smn_lemma[of 1 "[i]" 1 "[x]" ?p] by simp + also have "... = eval (r_universal 2) [?p, i, x]" + by (metis append_eq_Cons_conv nat_1_add_1) + also have "... = eval psi [i, x]" + using r_universal[OF assms, of "[i, x]"] by simp + finally have "eval (r_universal 1) [the (eval c [i]), x] = eval psi [i, x]" . + then show ?thesis using r_phi_def by simp + qed + ultimately show ?thesis using that by auto +qed + + +section \Fixed-point theorems\ + +text \Fixed-point theorems (also known as recursion theorems) come in +many shapes. We prove the minimum we need for Chapter~\ref{c:iirf}.\ + + +subsection \Rogers's fixed-point theorem\ + +text \In this section we prove a theorem that Rogers~\cite{Rogers87} +credits to Kleene, but admits that it is a special case and not the original +formulation. We follow Wikipedia~\cite{wiki-krt} and call it the Rogers's +fixed-point theorem.\ + +lemma s11_inj: "inj (\x. 
smn 1 p [x])" +proof + fix x\<^sub>1 x\<^sub>2 :: nat + assume "smn 1 p [x\<^sub>1] = smn 1 p [x\<^sub>2]" + then have "list_encode [code_constn 1 p, code_constn 1 x\<^sub>1, code_id 1 0] = + list_encode [code_constn 1 p, code_constn 1 x\<^sub>2, code_id 1 0]" + using smn_def by (simp add: prod_encode_eq) + then have "[code_constn 1 p, code_constn 1 x\<^sub>1, code_id 1 0] = + [code_constn 1 p, code_constn 1 x\<^sub>2, code_id 1 0]" + using list_decode_encode by metis + then have "code_constn 1 x\<^sub>1 = code_constn 1 x\<^sub>2" by simp + then show "x\<^sub>1 = x\<^sub>2" + using code_const1 code_constn code_constn_def encode_injective r_constn + by (metis One_nat_def length_Cons list.size(3) option.simps(1)) +qed + +definition "r_univuniv \ Cn 2 r_phi [Cn 2 r_phi [Id 2 0, Id 2 0], Id 2 1]" + +lemma r_univuniv_recfn: "recfn 2 r_univuniv" + by (simp add: r_univuniv_def) + +lemma r_univuniv_converg: + assumes "eval r_phi [x, x] \" + shows "eval r_univuniv [x, y] = eval r_phi [the (eval r_phi [x, x]), y]" + unfolding r_univuniv_def using assms r_univuniv_recfn r_phi_recfn by simp + +text \Strictly speaking this is a generalization of Rogers's theorem in +that it shows the existence of infinitely many fixed-points. In conventional +terms it says that for every total recursive $f$ and $k \in \mathbb{N}$ there is +an $n \geq k$ with $\varphi_n = \varphi_{f(n)}$.\ + +theorem rogers_fixed_point_theorem: + fixes k :: nat + assumes "recfn 1 f" and "total f" + shows "\n\k. \x. eval r_phi [n, x] = eval r_phi [the (eval f [n]), x]" +proof - + let ?p = "encode r_univuniv" + define h where "h = Cn 1 (r_smn 1 1) [r_const ?p, Id 1 0]" + then have "prim_recfn 1 h" + by simp + then have "total h" + by blast + have "eval h [x] = eval (Cn 1 (r_smn 1 1) [r_const ?p, Id 1 0]) [x]" for x + unfolding h_def by simp + then have h: "the (eval h [x]) = smn 1 ?p [x]" for x + by (simp add: r_smn) + + have "eval r_phi [the (eval h [x]), y] = eval r_univuniv [x, y]" for x y + proof - + have "eval r_phi [the (eval h [x]), y] = eval r_phi [smn 1 ?p [x], y]" + using h by simp + also have "... = eval r_phi [the (eval (r_smn 1 1) [?p, x]), y]" + by (simp add: r_smn) + also have "... = eval (r_universal 2) [?p, x, y]" + using r_phi_def smn_lemma[of 1 "[x]" 1 "[y]" ?p] + by (metis Cons_eq_append_conv One_nat_def Suc_1 length_Cons + less_numeral_extra(1) list.size(3) plus_1_eq_Suc) + finally show "eval r_phi [the (eval h [x]), y] = eval r_univuniv [x, y]" + using r_universal r_univuniv_recfn by simp + qed + then have *: "eval r_phi [the (eval h [x]), y] = eval r_phi [the (eval r_phi [x, x]), y]" + if "eval r_phi [x, x] \" for x y + using r_univuniv_converg that by simp + + let ?fh = "Cn 1 f [h]" + have "recfn 1 ?fh" + using `prim_recfn 1 h` assms by simp + then have "infinite {r. recfn 1 r \ r \ ?fh}" + using exteq_infinite[of ?fh 1] by simp + then have "infinite (encode ` {r. recfn 1 r \ r \ ?fh})" (is "infinite ?E") + using encode_injective by (meson finite_imageD inj_onI) + then have "infinite ((\x. smn 1 ?p [x]) ` ?E)" + using s11_inj[of ?p] by (simp add: finite_image_iff inj_on_subset) + moreover have "(\x. smn 1 ?p [x]) ` ?E = {smn 1 ?p [encode r] |r. recfn 1 r \ r \ ?fh}" + by auto + ultimately have "infinite {smn 1 ?p [encode r] |r. recfn 1 r \ r \ ?fh}" + by simp + then obtain n where "n \ k" "n \ {smn 1 ?p [encode r] |r. 
recfn 1 r \ r \ ?fh}" + by (meson finite_nat_set_iff_bounded_le le_cases) + then obtain r where r: "recfn 1 r" "n = smn 1 ?p [encode r]" "recfn 1 r \ r \ ?fh" + by auto + then have eval_r: "eval r [encode r] = eval ?fh [encode r]" + by (simp add: exteq_def) + then have eval_r': "eval r [encode r] = eval f [the (eval h [encode r])]" + using assms `total h` `prim_recfn 1 h` by simp + then have "eval r [encode r] \" + using `prim_recfn 1 h` assms(1,2) by simp + then have "eval r_phi [encode r, encode r] \" + by (simp add: \recfn 1 r\ r_phi) + then have "eval r_phi [the (eval h [encode r]), y] = + eval r_phi [(the (eval r_phi [encode r, encode r])), y]" + for y + using * by simp + then have "eval r_phi [the (eval h [encode r]), y] = + eval r_phi [(the (eval r [encode r])), y]" + for y + by (simp add: \recfn 1 r\ r_phi) + moreover have "n = the (eval h [encode r])" by (simp add: h r(2)) + ultimately have "eval r_phi [n, y] = eval r_phi [the (eval r [encode r]), y]" for y + by simp + then have "eval r_phi [n, y] = eval r_phi [the (eval ?fh [encode r]), y]" for y + using r by (simp add: eval_r) + moreover have "eval ?fh [encode r] = eval f [n]" + using eval_r eval_r' \n = the (eval h [encode r])\ by auto + ultimately have "eval r_phi [n, y] = eval r_phi [the (eval f [n]), y]" for y + by simp + with `n \ k` show ?thesis by auto +qed + + +subsection \Kleene's fixed-point theorem\ + +text \The next theorem is what Rogers~\cite[p.~214]{Rogers87} calls +Kleene's version of what we call Rogers's fixed-point theorem. More precisely +this would be Kleene's \emph{second} fixed-point theorem, but since we do not +cover the first one, we leave out the number.\ + +theorem kleene_fixed_point_theorem: + fixes k :: nat + assumes "recfn 2 psi" + shows "\n\k. \x. eval r_phi [n, x] = eval psi [n, x]" +proof - + from numbering_translation[OF assms] obtain c where c: + "recfn 1 c" + "total c" + "\i x. eval psi [i, x] = eval r_phi [the (eval c [i]), x]" + by auto + then obtain n where "n \ k" and "\x. eval r_phi [n, x] = eval r_phi [the (eval c [n]), x]" + using rogers_fixed_point_theorem by blast + with c(3) have "\x. eval r_phi [n, x] = eval psi [n, x]" + by simp + with `n \ k` show ?thesis by auto +qed + +text \Kleene's fixed-point theorem can be generalized to arbitrary +arities. But we need to generalize it only to binary functions in order to +show Smullyan's double fixed-point theorem in +Section~\ref{s:smullyan}.\ + +definition "r_univuniv2 \ + Cn 3 r_phi [Cn 3 (r_universal 2) [Id 3 0, Id 3 0, Id 3 1], Id 3 2]" + +lemma r_univuniv2_recfn: "recfn 3 r_univuniv2" + by (simp add: r_univuniv2_def) + +lemma r_univuniv2_converg: + assumes "eval (r_universal 2) [u, u, x] \" + shows "eval r_univuniv2 [u, x, y] = eval r_phi [the (eval (r_universal 2) [u, u, x]), y]" + unfolding r_univuniv2_def using assms r_univuniv2_recfn by simp + +theorem kleene_fixed_point_theorem_2: + assumes "recfn 2 f" and "total f" + shows "\n. + recfn 1 n \ + total n \ + (\x y. 
eval r_phi [(the (eval n [x])), y] = eval r_phi [(the (eval f [the (eval n [x]), x])), y])" +proof - + let ?p = "encode r_univuniv2" + let ?s = "r_smn 1 2" + define h where "h = Cn 2 ?s [r_dummy 1 (r_const ?p), Id 2 0, Id 2 1]" + then have [simp]: "prim_recfn 2 h" by simp + { + fix u x y + have "eval h [u, x] = eval (Cn 2 ?s [r_dummy 1 (r_const ?p), Id 2 0, Id 2 1]) [u, x]" + using h_def by simp + then have "the (eval h [u, x]) = smn 1 ?p [u, x]" + by (simp add: r_smn) + then have "eval r_phi [the (eval h [u, x]), y] = eval r_phi [smn 1 ?p [u, x], y]" + by simp + also have "... = + eval r_phi + [encode (Cn 1 (r_universal 3) (r_constn 0 ?p # r_constn 0 u # r_constn 0 x # [Id 1 0])), + y]" + using smn[of 1 ?p "[u, x]"] by (simp add: numeral_3_eq_3) + also have "... = + eval r_phi + [encode (Cn 1 (r_universal 3) (r_const ?p # r_const u # r_const x # [Id 1 0])), y]" + (is "_ = eval r_phi [encode ?f, y]") + by (simp add: r_constn_def) + also have "... = eval ?f [y]" + using r_phi'[of ?f] by auto + also have "... = eval (r_universal 3) [?p, u, x, y]" + using r_univuniv2_recfn r_universal r_phi by auto + also have "... = eval r_univuniv2 [u, x, y]" + using r_universal by (simp add: r_univuniv2_recfn) + finally have "eval r_phi [the (eval h [u, x]), y] = eval r_univuniv2 [u, x, y]" . + } + then have *: "eval r_phi [the (eval h [u, x]), y] = + eval r_phi [the (eval (r_universal 2) [u, u, x]), y]" + if "eval (r_universal 2) [u, u, x] \" for u x y + using r_univuniv2_converg that by simp + + let ?fh = "Cn 2 f [h, Id 2 1]" + let ?e = "encode ?fh" + have "recfn 2 ?fh" + using assms by simp + have "total h" + by auto + then have "total ?fh" + using assms Cn_total totalI2[of ?fh] by fastforce + + let ?n = "Cn 1 h [r_const ?e, Id 1 0]" + have "recfn 1 ?n" + using assms by simp + moreover have "total ?n" + using `total h` totalI1[of ?n] by simp + moreover { + fix x y + have "eval r_phi [(the (eval ?n [x])), y] = eval r_phi [(the (eval h [?e, x])), y]" + by simp + also have "... = eval r_phi [the (eval (r_universal 2) [?e, ?e, x]), y]" + using * r_universal[of _ 2] totalE[of ?fh 2] \total ?fh\ \recfn 2 ?fh\ + by (metis length_Cons list.size(3) numeral_2_eq_2) + also have "... = eval r_phi [the (eval f [the (eval h [?e, x]), x]), y]" + proof - + have "eval (r_universal 2) [?e, ?e, x] \" + using totalE[OF `total ?fh`] `recfn 2 ?fh` r_universal + by (metis length_Cons list.size(3) numeral_2_eq_2) + moreover have "eval (r_universal 2) [?e, ?e, x] = eval ?fh [?e, x]" + by (metis \recfn 2 ?fh\ length_Cons list.size(3) numeral_2_eq_2 r_universal) + then show ?thesis using assms `total h` by simp + qed + also have "... = eval r_phi [(the (eval f [the (eval ?n [x]), x])), y]" + by simp + finally have "eval r_phi [(the (eval ?n [x])), y] = + eval r_phi [(the (eval f [the (eval ?n [x]), x])), y]" . + } + ultimately show ?thesis by blast +qed + + +subsection \Smullyan's double fixed-point theorem\label{s:smullyan}\ + +theorem smullyan_double_fixed_point_theorem: + assumes "recfn 2 g" and "total g" and "recfn 2 h" and "total h" + shows "\m n. + (\x. eval r_phi [m, x] = eval r_phi [the (eval g [m, n]), x]) \ + (\x. eval r_phi [n, x] = eval r_phi [the (eval h [m, n]), x])" +proof - + obtain m where + "recfn 1 m" and + "total m" and + m: "\x y. 
eval r_phi [the (eval m [x]), y] = + eval r_phi [the (eval g [the (eval m [x]), x]), y]" + using kleene_fixed_point_theorem_2[of g] assms(1,2) by auto + define k where "k = Cn 1 h [m, Id 1 0]" + then have "recfn 1 k" + using `recfn 1 m` assms(3) by simp + have "total (Id 1 0)" + by (simp add: Mn_free_imp_total) + then have "total k" + using `total m` assms(4) Cn_total k_def `recfn 1 k` by simp + obtain n where n: "\x. eval r_phi [n, x] = eval r_phi [the (eval k [n]), x]" + using rogers_fixed_point_theorem[of k] `recfn 1 k` `total k` by blast + obtain mm where mm: "eval m [n] \= mm" + using `total m` `recfn 1 m` by fastforce + then have "\x. eval r_phi [mm, x] = eval r_phi [the (eval g [mm, n]), x]" + by (metis m option.sel) + moreover have "\x. eval r_phi [n, x] = eval r_phi [the (eval h [mm, n]), x]" + using k_def assms(3) `total m` `recfn 1 m` mm n by simp + ultimately show ?thesis by blast +qed + + +section \Decidable and recursively enumerable sets\label{s:decidable}\ + +text \We defined @{term decidable} already back in +Section~\ref{s:halting}: @{thm[display] decidable_def}\ + +text \The next theorem is adapted from @{thm[source] +halting_problem_undecidable}.\ + +theorem halting_problem_phi_undecidable: "\ decidable {x. eval r_phi [x, x] \}" + (is "\ decidable ?K") +proof + assume "decidable ?K" + then obtain f where "recfn 1 f" and f: "\x. eval f [x] \= (if x \ ?K then 1 else 0)" + using decidable_def by auto + define g where "g \ Cn 1 r_ifeq_else_diverg [f, Z, Z]" + then have "recfn 1 g" + using `recfn 1 f` r_ifeq_else_diverg_recfn by simp + then obtain i where i: "eval r_phi [i, x] = eval g [x]" for x + using r_phi' by auto + from g_def have "eval g [x] = (if x \ ?K then Some 0 else None)" for x + using r_ifeq_else_diverg_recfn `recfn 1 f` f by simp + then have "eval g [i] \ \ i \ ?K" by simp + also have "... \ eval r_phi [i, i] \" by simp + also have "... \ eval g [i] \" + using i by simp + finally have "eval g [i] \ \ eval g [i] \" . + then show False by auto +qed + +lemma decidable_complement: "decidable X \ decidable (- X)" +proof - + assume "decidable X" + then obtain f where f: "recfn 1 f" "\x. eval f [x] \= (if x \ X then 1 else 0)" + using decidable_def by auto + define g where "g = Cn 1 r_not [f]" + then have "recfn 1 g" + by (simp add: f(1)) + moreover have "eval g [x] \= (if x \ X then 0 else 1)" for x + by (simp add: g_def f) + ultimately show ?thesis using decidable_def by auto +qed + +text \Finite sets are decidable.\ + +fun r_contains :: "nat list \ recf" where + "r_contains [] = Z" +| "r_contains (x # xs) = Cn 1 r_ifeq [Id 1 0, r_const x, r_const 1, r_contains xs]" + +lemma r_contains_prim: "prim_recfn 1 (r_contains xs)" + by (induction xs) auto + +lemma r_contains: "eval (r_contains xs) [x] \= (if x \ set xs then 1 else 0)" +proof (induction xs arbitrary: x) + case Nil + then show ?case by simp +next + case (Cons a xs) + have "eval (r_contains (a # xs)) [x] = eval r_ifeq [x, a, 1, the (eval (r_contains xs) [x])]" + using r_contains_prim prim_recfn_total by simp + also have "... \= (if x = a then 1 else if x \ set xs then 1 else 0)" + using Cons.IH by simp + also have "... \= (if x = a \ x \ set xs then 1 else 0)" + by simp + finally show ?case by simp +qed + +lemma finite_set_decidable: "finite X \ decidable X" +proof - + fix X :: "nat set" + assume "finite X" + then obtain xs where "X = set xs" + using finite_list by auto + then have "\x. 
eval (r_contains xs) [x] \= (if x \ X then 1 else 0)" + using r_contains by simp + then show "decidable X" + using decidable_def r_contains_prim by blast +qed + +definition semidecidable :: "nat set \ bool" where + "semidecidable X \ (\f. recfn 1 f \ (\x. eval f [x] = (if x \ X then Some 1 else None)))" + +text \The semidecidable sets are the domains of partial recursive functions.\ + +lemma semidecidable_iff_domain: + "semidecidable X \ (\f. recfn 1 f \ (\x. eval f [x] \ \ x \ X))" +proof + show "semidecidable X \ \f. recfn 1 f \ (\x. (eval f [x] \) = (x \ X))" + using semidecidable_def by (metis option.distinct(1)) + show "semidecidable X" if "\f. recfn 1 f \ (\x. (eval f [x] \) = (x \ X))" for X + proof - + from that obtain f where f: "recfn 1 f" "\x. (eval f [x] \) = (x \ X)" + by auto + let ?g = "Cn 1 (r_const 1) [f]" + have "recfn 1 ?g" + using f(1) by simp + moreover have "\x. eval ?g [x] = (if x \ X then Some 1 else None)" + using f by simp + ultimately show "semidecidable X" + using semidecidable_def by blast + qed +qed + +lemma decidable_imp_semidecidable: "decidable X \ semidecidable X" +proof - + assume "decidable X" + then obtain f where f: "recfn 1 f" "\x. eval f [x] \= (if x \ X then 1 else 0)" + using decidable_def by auto + define g where "g = Cn 1 r_ifeq_else_diverg [f, r_const 1, r_const 1]" + then have "recfn 1 g" + by (simp add: f(1)) + have "eval g [x] = eval r_ifeq_else_diverg [if x \ X then 1 else 0, 1, 1]" for x + by (simp add: g_def f) + then have "\x. x \ X \ eval g [x] \= 1" and "\x. x \ X \ eval g [x] \" + by simp_all + then show ?thesis + using `recfn 1 g` semidecidable_def by auto +qed + +text \A set is recursively enumerable if it is empty or the image of a +total recursive function.\ + +definition recursively_enumerable :: "nat set \ bool" where + "recursively_enumerable X \ + X = {} \ (\f. recfn 1 f \ total f \ X = {the (eval f [x]) |x. x \ UNIV})" + +theorem recursively_enumerable_iff_semidecidable: + "recursively_enumerable X \ semidecidable X" +proof + show "semidecidable X" if "recursively_enumerable X" for X + proof (cases) + assume "X = {}" + then show ?thesis + using finite_set_decidable decidable_imp_semidecidable + recursively_enumerable_def semidecidable_def + by blast + next + assume "X \ {}" + with that obtain f where f: "recfn 1 f" "total f" "X = {the (eval f [x]) |x. x \ UNIV}" + using recursively_enumerable_def by blast + define h where "h = Cn 2 r_eq [Cn 2 f [Id 2 0], Id 2 1]" + then have "recfn 2 h" + using f(1) by simp + from h_def have h: "eval h [x, y] \= 0 \ the (eval f [x]) = y" for x y + using f(1,2) by simp + from h_def `recfn 2 h` totalI2 f(2) have "total h" by simp + define g where "g = Mn 1 h" + then have "recfn 1 g" + using h_def f(1) by simp + then have "eval g [y] = + (if (\x. eval h [x, y] \= 0 \ (\x')) + then Some (LEAST x. eval h [x, y] \= 0) + else None)" for y + using g_def `total h` f(2) by simp + then have "eval g [y] = + (if \x. eval h [x, y] \= 0 + then Some (LEAST x. eval h [x, y] \= 0) + else None)" for y + using `total h` `recfn 2 h` by simp + then have "eval g [y] \ \ (\x. eval h [x, y] \= 0)" for y + by simp + with h have "eval g [y] \ \ (\x. 
the (eval f [x]) = y)" for y + by simp + with f(3) have "eval g [y] \ \ y \ X" for y + by auto + with `recfn 1 g` semidecidable_iff_domain show ?thesis by auto + qed + + show "recursively_enumerable X" if "semidecidable X" for X + proof (cases) + assume "X = {}" + then show ?thesis using recursively_enumerable_def by simp + next + assume "X \ {}" + then obtain x\<^sub>0 where "x\<^sub>0 \ X" by auto + from that semidecidable_iff_domain obtain f where f: "recfn 1 f" "\x. eval f [x] \ \ x \ X" + by auto + let ?i = "encode f" + have i: "\x. eval f [x] = eval r_phi [?i, x]" + using r_phi' f(1) by simp + with `x\<^sub>0 \ X` f(2) have "eval r_phi [?i, x\<^sub>0] \" by simp + then obtain g where g: "recfn 1 g" "total g" "\x. eval r_phi [?i, x] \ = (\y. eval g [y] \= x)" + using f(1) nonempty_domain_enumerable by blast + with f(2) i have "\x. x \ X = (\y. eval g [y] \= x)" + by simp + then have "\x. x \ X = (\y. the (eval g [y]) = x)" + using totalE[OF g(2) g(1)] + by (metis One_nat_def length_Cons list.size(3) option.collapse option.sel) + then have "X = {the (eval g [y]) |y. y \ UNIV}" + by auto + with g(1,2) show ?thesis using recursively_enumerable_def by auto + qed +qed + +text \The next goal is to show that a set is decidable iff. it and its +complement are semidecidable. For this we use the concurrent evaluation +function.\ + +lemma semidecidable_decidable: + assumes "semidecidable X" and "semidecidable (- X)" + shows "decidable X" +proof - + obtain f where f: "recfn 1 f \ (\x. eval f [x] \ \ x \ X)" + using assms(1) semidecidable_iff_domain by auto + let ?i = "encode f" + obtain g where g: "recfn 1 g \ (\x. eval g [x] \ \ x \ (- X))" + using assms(2) semidecidable_iff_domain by auto + let ?j = "encode g" + define d where "d = Cn 1 r_pdec1 [Cn 1 r_parallel [r_const ?j, r_const ?i, Id 1 0]]" + then have "recfn 1 d" + by (simp add: d_def) + have *: "\x. eval r_phi [?i, x] = eval f [x]" "\x. eval r_phi [?j, x] = eval g [x]" + using f g r_phi' by simp_all + have "eval d [x] \= 1" if "x \ X" for x + proof - + have "eval f [x] \" + using f that by simp + moreover have "eval g [x] \" + using g that by blast + ultimately have "eval r_parallel [?j, ?i, x] \= prod_encode (1, the (eval f [x]))" + using * r_parallel(3) by simp + with d_def show ?thesis by simp + qed + moreover have "eval d [x] \= 0" if "x \ X" for x + proof - + have "eval g [x] \" + using g that by simp + moreover have "eval f [x] \" + using f that by blast + ultimately have "eval r_parallel [?j, ?i, x] \= prod_encode (0, the (eval g [x]))" + using * r_parallel(2) by blast + with d_def show ?thesis by simp + qed + ultimately show ?thesis + using decidable_def `recfn 1 d` by auto +qed + +theorem decidable_iff_semidecidable_complement: + "decidable X \ semidecidable X \ semidecidable (- X)" + using semidecidable_decidable decidable_imp_semidecidable decidable_complement + by blast + + +section \Rice's theorem\ + +definition index_set :: "nat set \ bool" where + "index_set I \ \i j. i \ I \ (\x. eval r_phi [i, x] = eval r_phi [j, x]) \ j \ I" + +lemma index_set_closed_in: + assumes "index_set I" and "i \ I" and "\x. eval r_phi [i, x] = eval r_phi [j, x]" + shows "j \ I" + using index_set_def assms by simp + +lemma index_set_closed_not_in: + assumes "index_set I" and "i \ I" and "\x. 
eval r_phi [i, x] = eval r_phi [j, x]" + shows "j \ I" + using index_set_def assms by metis + +theorem rice_theorem: + assumes "index_set I" and "I \ UNIV" and "I \ {}" + shows "\ decidable I" +proof + assume "decidable I" + then obtain d where d: "recfn 1 d" "\i. eval d [i] \= (if i \ I then 1 else 0)" + using decidable_def by auto + obtain j\<^sub>1 j\<^sub>2 where "j\<^sub>1 \ I" and "j\<^sub>2 \ I" + using assms(2,3) by auto + let ?if = "Cn 2 r_ifz [Cn 2 d [Id 2 0], r_dummy 1 (r_const j\<^sub>2), r_dummy 1 (r_const j\<^sub>1)]" + define psi where "psi = Cn 2 r_phi [?if, Id 2 1] " + then have "recfn 2 psi" + by (simp add: d) + have "eval ?if [x, y] = Some (if x \ I then j\<^sub>1 else j\<^sub>2)" for x y + by (simp add: d) + moreover have "eval psi [x, y] = eval (Cn 2 r_phi [?if, Id 2 1]) [x, y]" for x y + using psi_def by simp + ultimately have psi: "eval psi [x, y] = eval r_phi [if x \ I then j\<^sub>1 else j\<^sub>2, y]" for x y + by (simp add: d) + then have in_I: "eval psi [x, y] = eval r_phi [j\<^sub>1, y]" if "x \ I" for x y + by (simp add: that) + have not_in_I: "eval psi [x, y] = eval r_phi [j\<^sub>2, y]" if "x \ I" for x y + by (simp add: psi that) + obtain n where n: "\x. eval r_phi [n, x] = eval psi [n, x]" + using kleene_fixed_point_theorem[OF `recfn 2 psi`] by auto + show False + proof cases + assume "n \ I" + then have "\x. eval r_phi [n, x] = eval r_phi [j\<^sub>1, x]" + using n in_I by simp + then have "n \ I" + using `j\<^sub>1 \ I` index_set_closed_not_in[OF assms(1)] by simp + with `n \ I` show False by simp + next + assume "n \ I" + then have "\x. eval r_phi [n, x] = eval r_phi [j\<^sub>2, x]" + using n not_in_I by simp + then have "n \ I" + using `j\<^sub>2 \ I` index_set_closed_in[OF assms(1)] by simp + with `n \ I` show False by simp + qed +qed + + +section \Partial recursive functions as actual functions\label{s:alternative}\ + +text \A well-formed @{typ recf} describes an algorithm. Usually, +however, partial recursive functions are considered to be partial functions, +that is, right-unique binary relations. This distinction did not matter much +until now, because we were mostly concerned with the \emph{existence} of +partial recursive functions, which is equivalent to the existence of +algorithms. Whenever it did matter, we could use the extensional equivalence +@{term "exteq"}. In Chapter~\ref{c:iirf}, however, we will deal with sets of +functions and sets of sets of functions. + +For illustration consider the singleton set containing only the unary zero +function. It could be expressed by @{term "{Z}"}, but this would not contain +@{term[names_short] "Cn 1 (Id 1 0) [Z]"}, which computes the same function. +The alternative representation as @{term "{f. f \ Z}"} is not a +singleton set. Another alternative would be to identify partial recursive +functions with the equivalence classes of @{term "exteq"}. This would work +for all arities. But since we will only need unary and binary functions, we +can go for the less general but simpler alternative of regarding partial +recursive functions as certain functions of types @{typ "nat \ +nat option"} and @{typ "nat \ nat \ nat option"}. +With this notation we can represent the aforementioned set by @{term +"{\_. Some (0::nat)}"} and express that the function @{term "\_. +Some (0::nat)"} is total recursive. 
+ +In addition terms get shorter, for instance, @{term "eval r_func [i, x]"} +becomes @{term "func i x"}.\ + + +subsection \The definitions\ + +type_synonym partial1 = "nat \ nat option" + +type_synonym partial2 = "nat \ nat \ nat option" + +definition total1 :: "partial1 \ bool" where + "total1 f \ \x. f x \" + +definition total2 :: "partial2 \ bool" where + "total2 f \ \x y. f x y \" + +lemma total1I [intro]: "(\x. f x \) \ total1 f" + using total1_def by simp + +lemma total2I [intro]: "(\x y. f x y \) \ total2 f" + using total2_def by simp + +lemma total1E [dest, simp]: "total1 f \ f x \" + using total1_def by simp + +lemma total2E [dest, simp]: "total2 f \ f x y \" + using total2_def by simp + +definition P1 :: "partial1 set" ("\

") where + "\

\ {\x. eval r [x] |r. recfn 1 r}" + +definition P2 :: "partial2 set" ("\

\<^sup>2") where + "\

\<^sup>2 \ {\x y. eval r [x, y] |r. recfn 2 r}" + +definition R1 :: "partial1 set" ("\") where + "\ \ {\x. eval r [x] |r. recfn 1 r \ total r}" + +definition R2 :: "partial2 set" ("\\<^sup>2") where + "\\<^sup>2 \ {\x y. eval r [x, y] |r. recfn 2 r \ total r}" + +definition Prim1 :: "partial1 set" where + "Prim1 \ {\x. eval r [x] |r. prim_recfn 1 r}" + +definition Prim2 :: "partial2 set" where + "Prim2 \ {\x y. eval r [x, y] |r. prim_recfn 2 r}" + +lemma R1_imp_P1 [simp, elim]: "f \ \ \ f \ \

" + using R1_def P1_def by auto + +lemma R2_imp_P2 [simp, elim]: "f \ \\<^sup>2 \ f \ \

\<^sup>2" + using R2_def P2_def by auto + +lemma Prim1_imp_R1 [simp, elim]: "f \ Prim1 \ f \ \" + unfolding Prim1_def R1_def by auto + +lemma Prim2_imp_R2 [simp, elim]: "f \ Prim2 \ f \ \\<^sup>2" + unfolding Prim2_def R2_def by auto + +lemma P1E [elim]: + assumes "f \ \

" + obtains r where "recfn 1 r" and "\x. eval r [x] = f x" + using assms P1_def by force + +lemma P2E [elim]: + assumes "f \ \

\<^sup>2" + obtains r where "recfn 2 r" and "\x y. eval r [x, y] = f x y" + using assms P2_def by force + +lemma P1I [intro]: + assumes "recfn 1 r" and "(\x. eval r [x]) = f" + shows "f \ \

" + using assms P1_def by auto + +lemma P2I [intro]: + assumes "recfn 2 r" and "\x y. eval r [x, y] = f x y" + shows "f \ \

\<^sup>2" +proof - + have "(\x y. eval r [x, y]) = f" + using assms(2) by simp + then show ?thesis + using assms(1) P2_def by auto +qed + +lemma R1I [intro]: + assumes "recfn 1 r" and "total r" and "\x. eval r [x] = f x" + shows "f \ \" + unfolding R1_def + using CollectI[of "\f. \r. f = (\x. eval r [x]) \ recfn 1 r \ total r" f] assms + by metis + +lemma R1E [elim]: + assumes "f \ \" + obtains r where "recfn 1 r" and "total r" and "f = (\x. eval r [x])" + using assms R1_def by auto + +lemma R2I [intro]: + assumes "recfn 2 r" and "total r" and "\x y. eval r [x, y] = f x y" + shows "f \ \\<^sup>2" + unfolding R2_def + using CollectI[of "\f. \r. f = (\x y. eval r [x, y]) \ recfn 2 r \ total r" f] assms + by metis + +lemma R1_SOME: + assumes "f \ \" + and "r = (SOME r'. recfn 1 r' \ total r' \ f = (\x. eval r' [x]))" + (is "r = (SOME r'. ?P r')") + shows "recfn 1 r" + and "\x. eval r [x] \" + and "\x. f x = eval r [x]" + and "f = (\x. eval r [x])" +proof - + obtain r' where "?P r'" + using R1E[OF assms(1)] by auto + then show "recfn 1 r" "\b. eval r [b] \" "\x. f x = eval r [x]" + using someI[of ?P r'] assms(2) totalE[of r] by (auto, metis) + then show "f = (\x. eval r [x])" by auto +qed + +lemma R2E [elim]: + assumes "f \ \\<^sup>2" + obtains r where "recfn 2 r" and "total r" and "f = (\x\<^sub>1 x\<^sub>2. eval r [x\<^sub>1, x\<^sub>2])" + using assms R2_def by auto + +lemma R1_imp_total1 [simp]: "f \ \ \ total1 f" + using total1I by fastforce + +lemma R2_imp_total2 [simp]: "f \ \\<^sup>2 \ total2 f" + using totalE by fastforce + +lemma Prim1I [intro]: + assumes "prim_recfn 1 r" and "\x. f x = eval r [x]" + shows "f \ Prim1" + using assms Prim1_def by blast + +lemma Prim2I [intro]: + assumes "prim_recfn 2 r" and "\x y. f x y = eval r [x, y]" + shows "f \ Prim2" + using assms Prim2_def by blast + +lemma P1_total_imp_R1 [intro]: + assumes "f \ \

" and "total1 f" + shows "f \ \" + using assms totalI1 by force + +lemma P2_total_imp_R2 [intro]: + assumes "f \ \

\<^sup>2 " and "total2 f" + shows "f \ \\<^sup>2" + using assms totalI2 by force + + +subsection \Some simple properties\ + +text \In order to show that a @{typ partial1} or @{typ partial2} +function is in @{term "\

"}, @{term "\

\<^sup>2"}, @{term "\"}, @{term +"\\<^sup>2"}, @{term "Prim1"}, or @{term "Prim2"} we will usually have to +find a suitable @{typ recf}. But for some simple or frequent cases this +section provides shortcuts.\ + +lemma identity_in_R1: "Some \ \" +proof - + have "\x. eval (Id 1 0) [x] \= x" by simp + moreover have "recfn 1 (Id 1 0)" by simp + moreover have "total (Id 1 0)" + by (simp add: totalI1) + ultimately show ?thesis by blast +qed + +lemma P2_proj_P1 [simp, elim]: + assumes "\ \ \

\<^sup>2" + shows "\ i \ \

" +proof - + from assms obtain u where u: "recfn 2 u" "(\x\<^sub>1 x\<^sub>2. eval u [x\<^sub>1, x\<^sub>2]) = \" + by auto + define v where "v \ Cn 1 u [r_const i, Id 1 0]" + then have "recfn 1 v" "(\x. eval v [x]) = \ i" + using u by auto + then show ?thesis by auto +qed + +lemma R2_proj_R1 [simp, elim]: + assumes "\ \ \\<^sup>2" + shows "\ i \ \" +proof - + from assms have "\ \ \

\<^sup>2" by simp + then have "\ i \ \

" by auto + moreover have "total1 (\ i)" + using assms by (simp add: total1I) + ultimately show ?thesis by auto +qed + +lemma const_in_Prim1: "(\_. Some c) \ Prim1" +proof - + define r where "r = r_const c" + then have "\x. eval r [x] = Some c" by simp + moreover have "recfn 1 r" "Mn_free r" + using r_def by simp_all + ultimately show ?thesis by auto +qed + +lemma concat_P1_P1: + assumes "f \ \

" and "g \ \

" + shows "(\x. if g x \ \ f (the (g x)) \ then Some (the (f (the (g x)))) else None) \ \

" + (is "?h \ \

") +proof - + obtain rf where rf: "recfn 1 rf" "\x. eval rf [x] = f x" + using assms(1) by auto + obtain rg where rg: "recfn 1 rg" "\x. eval rg [x] = g x" + using assms(2) by auto + let ?rh = "Cn 1 rf [rg]" + have "recfn 1 ?rh" + using rf(1) rg(1) by simp + moreover have "eval ?rh [x] = ?h x" for x + using rf rg by simp + ultimately show ?thesis by blast +qed + +lemma P1_update_P1: + assumes "f \ \

" + shows "f(x:=z) \ \

" +proof (cases z) + case None + define re where "re \ Mn 1 (r_constn 1 1)" + from assms obtain r where r: "recfn 1 r" "(\u. eval r [u]) = f" + by auto + define r' where "r' = Cn 1 (r_lifz re r) [Cn 1 r_eq [Id 1 0, r_const x], Id 1 0]" + have "recfn 1 r'" + using r(1) r'_def re_def by simp + then have "eval r' [u] = eval (r_lifz re r) [if u = x then 0 else 1, u]" for u + using r'_def by simp + with r(1) have "eval r' [u] = (if u = x then None else eval r [u])" for u + using re_def re_def by simp + with r(2) have "eval r' [u] = (f(x:=None)) u" for u + by auto + then have "(\u. eval r' [u]) = f(x:=None)" + by auto + with None `recfn 1 r'` show ?thesis by auto +next + case (Some y) + from assms obtain r where r: "recfn 1 r" "(\u. eval r [u]) = f" + by auto + define r' where + "r' \ Cn 1 (r_lifz (r_const y) r) [Cn 1 r_eq [Id 1 0, r_const x], Id 1 0]" + have "recfn 1 r'" + using r(1) r'_def by simp + then have "eval r' [u] = eval (r_lifz (r_const y) r) [if u = x then 0 else 1, u]" for u + using r'_def by simp + with r(1) have "eval r' [u] = (if u = x then Some y else eval r [u])" for u + by simp + with r(2) have "eval r' [u] = (f(x:=Some y)) u" for u + by auto + then have "(\u. eval r' [u]) = f(x:=Some y)" + by auto + with Some `recfn 1 r'` show ?thesis by auto +qed + +lemma swap_P2: + assumes "f \ \

\<^sup>2" + shows "(\x y. f y x) \ \

\<^sup>2" +proof - + obtain r where r: "recfn 2 r" "\x y. eval r [x, y] = f x y" + using assms by auto + then have "eval (r_swap r) [x, y] = f y x" for x y + by simp + moreover have "recfn 2 (r_swap r)" + using r_swap_recfn r(1) by simp + ultimately show ?thesis by auto +qed + +lemma swap_R2: + assumes "f \ \\<^sup>2" + shows "(\x y. f y x) \ \\<^sup>2" + using swap_P2[of f] assms + by (meson P2_total_imp_R2 R2_imp_P2 R2_imp_total2 total2E total2I) + +lemma skip_P1: + assumes "f \ \

" + shows "(\x. f (x + n)) \ \

" +proof - + obtain r where r: "recfn 1 r" "\x. eval r [x] = f x" + using assms by auto + let ?s = "Cn 1 r [Cn 1 r_add [Id 1 0, r_const n]]" + have "recfn 1 ?s" + using r by simp + have "eval ?s [x] = eval r [x + n]" for x + using r by simp + with r have "eval ?s [x] = f (x + n)" for x + by simp + with `recfn 1 ?s` show ?thesis by blast +qed + +lemma skip_R1: + assumes "f \ \" + shows "(\x. f (x + n)) \ \" + using assms skip_P1 R1_imp_total1 total1_def by auto + + +subsection \The Gödel numbering @{term \}\label{s:goedel_numbering}\ + +text \While the term \emph{Gödel numbering} is often used generically for +mappings between natural numbers and mathematical concepts, the inductive +inference literature uses it in a more specific sense. There it is equivalent +to the notion of acceptable numbering~\cite{Rogers87}: For every numbering +there is a recursive function mapping the numbering's indices to equivalent +ones of a Gödel numbering.\ + +definition goedel_numbering :: "partial2 \ bool" where + "goedel_numbering \ \ \ \ \

\<^sup>2 \ (\\\\

\<^sup>2. \c\\. \i. \ i = \ (the (c i)))" + +lemma goedel_numbering_P2: + assumes "goedel_numbering \" + shows "\ \ \

\<^sup>2" + using goedel_numbering_def assms by simp + +lemma goedel_numberingE: + assumes "goedel_numbering \" and "\ \ \

\<^sup>2" + obtains c where "c \ \" and "\i. \ i = \ (the (c i))" + using assms goedel_numbering_def by blast + +lemma goedel_numbering_universal: + assumes "goedel_numbering \" and "f \ \

" + shows "\i. \ i = f" +proof - + define \ :: partial2 where "\ = (\i. f)" + have "\ \ \

\<^sup>2" + proof - + obtain rf where rf: "recfn 1 rf" "\x. eval rf [x] = f x" + using assms(2) by auto + define r where "r = Cn 2 rf [Id 2 1]" + then have r: "recfn 2 r" "\i x. eval r [i, x] = eval rf [x]" + using rf(1) by simp_all + with rf(2) have "\i x. eval r [i, x] = f x" by simp + with r(1) show ?thesis using \_def by auto + qed + then obtain c where "c \ \" and "\i. \ i = \ (the (c i))" + using goedel_numbering_def assms(1) by auto + with \_def show ?thesis by auto +qed + +text \Our standard Gödel numbering is based on @{term r_phi}:\ + +definition phi :: partial2 ("\") where + "\ i x \ eval r_phi [i, x]" + +lemma phi_in_P2: "\ \ \

\<^sup>2" + unfolding phi_def using r_phi_recfn by blast + +text \Indices of any numbering can be translated into equivalent indices +of @{term phi}, which thus is a Gödel numbering.\ + +lemma numbering_translation_for_phi: + assumes "\ \ \

\<^sup>2" + shows "\c\\. \i. \ i = \ (the (c i))" +proof - + obtain psi where psi: "recfn 2 psi" "\i x. eval psi [i, x] = \ i x" + using assms by auto + with numbering_translation obtain b where + "recfn 1 b" "total b" "\i x. eval psi [i, x] = eval r_phi [the (eval b [i]), x]" + by blast + moreover from this obtain c where c: "c \ \" "\i. c i = eval b [i]" + by fast + ultimately have "\ i x = \ (the (c i)) x" for i x + using phi_def psi(2) by presburger + then have "\ i = \ (the (c i))" for i + by auto + then show ?thesis using c(1) by blast +qed + +corollary goedel_numbering_phi: "goedel_numbering \" + unfolding goedel_numbering_def using numbering_translation_for_phi phi_in_P2 by simp + +corollary phi_universal: + assumes "f \ \

" + obtains i where "\ i = f" + using goedel_numbering_universal[OF goedel_numbering_phi assms] by auto + + +subsection \Fixed-point theorems\ + +text \The fixed-point theorems look somewhat cleaner in the new +notation. We will only need the following ones in the next chapter.\ + +theorem kleene_fixed_point: + fixes k :: nat + assumes "\ \ \

\<^sup>2" + obtains i where "i \ k" and "\ i = \ i" +proof - + obtain r_psi where r_psi: "recfn 2 r_psi" "\i x. eval r_psi [i, x] = \ i x" + using assms by auto + then obtain i where i: "i \ k" "\x. eval r_phi [i, x] = eval r_psi [i, x]" + using kleene_fixed_point_theorem by blast + then have "\x. \ i x = \ i x" + using phi_def r_psi by simp + then show ?thesis using i that by blast +qed + +theorem smullyan_double_fixed_point: + assumes "g \ \\<^sup>2" and "h \ \\<^sup>2" + obtains m n where "\ m = \ (the (g m n))" and "\ n = \ (the (h m n))" +proof - + obtain rg where rg: "recfn 2 rg" "total rg" "g = (\x y. eval rg [x, y])" + using R2E[OF assms(1)] by auto + moreover obtain rh where rh: "recfn 2 rh" "total rh" "h = (\x y. eval rh [x, y])" + using R2E[OF assms(2)] by auto + ultimately obtain m n where + "\x. eval r_phi [m, x] = eval r_phi [the (eval rg [m, n]), x]" + "\x. eval r_phi [n, x] = eval r_phi [the (eval rh [m, n]), x]" + using smullyan_double_fixed_point_theorem[of rg rh] by blast + then have "\ m = \ (the (g m n))" and "\ n = \ (the (h m n))" + using phi_def rg rh by auto + then show ?thesis using that by simp +qed + +end \ No newline at end of file diff --git a/thys/Inductive_Inference/TOTAL_CONS.thy b/thys/Inductive_Inference/TOTAL_CONS.thy new file mode 100644 --- /dev/null +++ b/thys/Inductive_Inference/TOTAL_CONS.thy @@ -0,0 +1,1468 @@ +section \TOTAL is a proper subset of CONS\label{s:total_cons}\ + +theory TOTAL_CONS + imports Lemma_R (* for r_auxhyp *) + CP_FIN_NUM (* for r_consistent *) + CONS_LIM (* for rmge2, goedel_at *) +begin + +text \We first show that TOTAL is a subset of CONS. Then we present a +separating class.\ + + +subsection \TOTAL is a subset of CONS\ + +text \A TOTAL strategy hypothesizes only total functions, for which the +consistency with the input prefix is decidable. A CONS strategy can thus run +a TOTAL strategy and check if its hypothesis is consistent. If so, it +outputs this hypothesis, otherwise some arbitrary consistent one. Since the +TOTAL strategy converges to a correct hypothesis, which is consistent, the +CONS strategy will converge to the same hypothesis.\ + +text \Without loss of generality we can assume that learning takes place +with respect to our Gödel numbering $\varphi$. So we need to decide +consistency only for this numbering.\ + +abbreviation r_consist_phi where + "r_consist_phi \ r_consistent r_phi" + +lemma r_consist_phi_recfn [simp]: "recfn 2 r_consist_phi" + by simp + +lemma r_consist_phi: + assumes "\k i k \" + shows "eval r_consist_phi [i, e] \= + (if \k i k \= e_nth e k then 0 else 1)" +proof - + have "\k" + using assms phi_def by simp + moreover have "recfn 2 r_phi" by simp + ultimately have "eval (r_consistent r_phi) [i, e] \= + (if \k= e_nth e k then 0 else 1)" + using r_consistent_converg assms by simp + then show ?thesis using phi_def by simp +qed + +lemma r_consist_phi_init: + assumes "f \ \" and "\ i \ \" + shows "eval r_consist_phi [i, f \ n] \= (if \k\n. \ i k = f k then 0 else 1)" + using assms r_consist_phi R1_imp_total1 total1E by (simp add: r_consist_phi) + +lemma TOTAL_subseteq_CONS: "TOTAL \ CONS" +proof + fix U assume "U \ TOTAL" + then have "U \ TOTAL_wrt \" + using TOTAL_wrt_phi_eq_TOTAL by blast + then obtain t' where t': "learn_total \ U t'" + using TOTAL_wrt_def by auto + then obtain t where t: "recfn 1 t" "\x. 
eval t [x] = t' x" + using learn_totalE(1) P1E by blast + then have t_converg: "eval t [f \ n] \" if "f \ U" for f n + using t' learn_totalE(1) that by auto + + define s where "s \ Cn 1 r_ifz [Cn 1 r_consist_phi [t, Id 1 0], t, r_auxhyp]" + then have "recfn 1 s" + using r_consist_phi_recfn r_auxhyp_prim t(1) by simp + + have consist: "eval r_consist_phi [the (eval t [f \ n]), f \ n] \= + (if \k\n. \ (the (eval t [f \ n])) k = f k then 0 else 1)" + if "f \ U" for f n + proof - + have "eval r_consist_phi [the (eval t [f \ n]), f \ n] = + eval (Cn 1 r_consist_phi [t, Id 1 0]) [f \ n]" + using that t_converg t(1) by simp + also have "... \= (if \k\n. \ (the (eval t [f \ n])) k = f k then 0 else 1)" + proof - + from that have "f \ \" + using learn_totalE(1) t' by blast + moreover have "\ (the (eval t [f \ n])) \ \" + using t' t learn_totalE t_converg that by simp + ultimately show ?thesis + using r_consist_phi_init t_converg t(1) that by simp + qed + finally show ?thesis . + qed + + have s_eq_t: "eval s [f \ n] = eval t [f \ n]" + if "\k\n. \ (the (eval t [f \ n])) k = f k" and "f \ U" for f n + using that consist s_def t r_auxhyp_prim prim_recfn_total + by simp + + have s_eq_aux: "eval s [f \ n] = eval r_auxhyp [f \ n]" + if "\ (\k\n. \ (the (eval t [f \ n])) k = f k)" and "f \ U" for f n + proof - + from that have "eval r_consist_phi [the (eval t [f \ n]), f \ n] \= 1" + using consist by simp + moreover have "t' (f \ n) \" using t' learn_totalE(1) that(2) by blast + ultimately show ?thesis + using s_def t r_auxhyp_prim t' learn_totalE by simp + qed + + have "learn_cons \ U (\e. eval s [e])" + proof (rule learn_consI) + have "eval s [f \ n] \" if "f \ U" for f n + using that t_converg[OF that, of n] s_eq_t[of n f] prim_recfn_total[of r_auxhyp 1] + r_auxhyp_prim s_eq_aux[OF _ that, of n] totalE + by fastforce + then show "environment \ U (\e. eval s [e])" + using t' `recfn 1 s` learn_totalE(1) by blast + show "\i. \ i = f \ (\\<^sup>\n. eval s [f \ n] \= i)" if "f \ U" for f + proof - + from that t' t learn_totalE obtain i n\<^sub>0 where + i_n0: "\ i = f \ (\n\n\<^sub>0. eval t [f \ n] \= i)" + by metis + then have "\n. n \ n\<^sub>0 \ \k\n. \ (the (eval t [f \ n])) k = f k" + by simp + with s_eq_t have "\n. n \ n\<^sub>0 \ eval s [f \ n] = eval t [f \ n]" + using that by simp + with i_n0 have "\n. n \ n\<^sub>0 \ eval s [f \ n] \= i" + by auto + with i_n0 show ?thesis by auto + qed + show "\k\n. \ (the (eval s [f \ n])) k = f k" if "f \ U" for f n + proof (cases "\k\n. \ (the (eval t [f \ n])) k = f k") + case True + with that s_eq_t show ?thesis by simp + next + case False + then have "eval s [f \ n] = eval r_auxhyp [f \ n]" + using that s_eq_aux by simp + moreover have "f \ \" + using learn_totalE(1)[OF t'] that by auto + ultimately show ?thesis using r_auxhyp by simp + qed + qed + then show "U \ CONS" using CONS_def by auto +qed + + +subsection \The separating class\ + + +subsubsection \Definition of the class\ + +text \The class that will be shown to be in @{term "CONS - TOTAL"} is +the union of the following two classes.\ + +definition V_constotal_1 :: "partial1 set" where + "V_constotal_1 \ {f. \j p. f = [j] \ p \ j \ 2 \ p \ \\<^sub>0\<^sub>1 \ \ j = f}" + +definition V_constotal_2 :: "partial1 set" where + "V_constotal_2 \ + {f. \j a k. 
+ f = j # a @ [k] \ 0\<^sup>\ \ + j \ 2 \ + (\i 1) \ + k \ 2 \ + \ j = j # a \ \\<^sup>\ \ + \ k = f}" + +definition V_constotal :: "partial1 set" where + "V_constotal \ V_constotal_1 \ V_constotal_2" + +lemma V_constotal_2I: + assumes "f = j # a @ [k] \ 0\<^sup>\" + and "j \ 2" + and "\i 1" + and "k \ 2" + and "\ j = j # a \ \\<^sup>\" + and "\ k = f" + shows "f \ V_constotal_2" + using assms V_constotal_2_def by blast + +lemma V_subseteq_R1: "V_constotal \ \" +proof + fix f assume "f \ V_constotal" + then have "f \ V_constotal_1 \ f \ V_constotal_2" + using V_constotal_def by auto + then show "f \ \" + proof + assume "f \ V_constotal_1" + then obtain j p where "f = [j] \ p" "p \ \\<^sub>0\<^sub>1" + using V_constotal_1_def by blast + then show ?thesis using prepend_in_R1 RPred1_subseteq_R1 by auto + next + assume "f \ V_constotal_2" + then obtain j a k where "f = j # a @ [k] \ 0\<^sup>\" + using V_constotal_2_def by blast + then show ?thesis using almost0_in_R1 by auto + qed +qed + + +subsubsection \The class is in CONS\ + +text \The class can be learned by the strategy @{term rmge2}, which +outputs the rightmost value greater or equal two in the input $f^n$. If $f$ +is from $V_1$ then the strategy is correct right from the start. If $f$ is +from $V_2$ the strategy outputs the consistent hypothesis $j$ until it +encounters the correct hypothesis $k$, to which it converges.\ + +lemma V_in_CONS: "learn_cons \ V_constotal rmge2" +proof (rule learn_consI) + show "environment \ V_constotal rmge2" + using V_subseteq_R1 rmge2_in_R1 R1_imp_total1 phi_in_P2 by simp + have "(\i. \ i = f \ (\\<^sup>\n. rmge2 (f \ n) \= i)) \ + (\n. \k\n. \ (the (rmge2 (f \ n))) k = f k)" + if "f \ V_constotal" for f + proof (cases "f \ V_constotal_1") + case True + then obtain j p where + f: "f = [j] \ p" and + j: "j \ 2" and + p: "p \ \\<^sub>0\<^sub>1" and + phi_j: "\ j = f" + using V_constotal_1_def by blast + then have "f 0 \= j" by (simp add: prepend_at_less) + then have f_at_0: "the (f 0) \ 2" by (simp add: j) + have f_at_gr0: "the (f x) \ 1" if "x > 0" for x + using that f p by (simp add: RPred1_altdef Suc_leI prepend_at_ge) + have "total1 f" + using V_subseteq_R1 that R1_imp_total1 total1_def by auto + have "rmge2 (f \ n) \= j" for n + proof - + let ?P = "\i. i < Suc n \ the (f i) \ 2" + have "Greatest ?P = 0" + proof (rule Greatest_equality) + show "0 < Suc n \ 2 \ the (f 0)" + using f_at_0 by simp + show "\y. y < Suc n \ 2 \ the (f y) \ y \ 0" + using f_at_gr0 by fastforce + qed + then have "rmge2 (f \ n) = f 0" + using f_at_0 rmge2_init_total[of f n, OF `total1 f`] by auto + then show "rmge2 (f \ n) \= j" + by (simp add: \f 0 \= j\) + qed + then show ?thesis using phi_j by auto + next + case False + then have "f \ V_constotal_2" + using V_constotal_def that by auto + then obtain j a k where jak: + "f = j # a @ [k] \ 0\<^sup>\" + "j \ 2" + "\i 1" + "k \ 2" + "\ j = j # a \ \\<^sup>\ " + "\ k = f" + using V_constotal_2_def by blast + then have f_at_0: "f 0 \= j" by simp + have f_eq_a: "f x \= a ! (x - 1)" if "0 < x \ x < Suc (length a)" for x + proof - + have "x - 1 < length a" + using that by auto + then show ?thesis + by (simp add: jak(1) less_SucI nth_append that) + qed + then have f_at_a: "the (f x) \ 1" if "0 < x \ x < Suc (length a)" for x + using jak(3) that by auto + from jak have f_k: "f (Suc (length a)) \= k" by auto + from jak have f_at_big: "f x \= 0" if "x > Suc (length a)" for x + using that by simp + let ?P = "\n i. 
i < Suc n \ the (f i) \ 2" + have rmge2: "rmge2 (f \ n) = f (Greatest (?P n))" for n + proof - + have "\ (\i 2 \ the (f 0)" + using that by (simp add: jak(2) f_at_0) + show "\y. y < Suc n \ 2 \ the (f y) \ y \ 0" + using that f_at_a + by (metis Suc_1 dual_order.strict_trans leI less_Suc_eq not_less_eq_eq) + qed + with rmge2 f_at_0 have rmge2_small: + "rmge2 (f \ n) \= j" if "n < Suc (length a)" for n + using that by simp + have "Greatest (?P n) = Suc (length a)" if "n \ Suc (length a)" for n + proof (rule Greatest_equality) + show "Suc (length a) < Suc n \ 2 \ the (f (Suc (length a)))" + using that f_k by (simp add: jak(4) less_Suc_eq_le) + show "\y. y < Suc n \ 2 \ the (f y) \ y \ Suc (length a)" + using that f_at_big by (metis leI le_SucI not_less_eq_eq numeral_2_eq_2 option.sel) + qed + with rmge2 f_at_big f_k have rmge2_big: + "rmge2 (f \ n) \= k" if "n \ Suc (length a)" for n + using that by simp + then have "\i n\<^sub>0. \ i = f \ (\n\n\<^sub>0. rmge2 (f \ n) \= i)" + using jak(6) by auto + moreover have "\k\n. \ (the (rmge2 (f \ n))) k = f k" for n + proof (cases "n < Suc (length a)") + case True + then have "rmge2 (f \ n) \= j" + using rmge2_small by simp + then have "\ (the (rmge2 (f \ n))) = \ j" by simp + with True show ?thesis + using rmge2_small f_at_0 f_eq_a jak(5) prepend_at_less + by (metis le_less_trans le_zero_eq length_Cons not_le_imp_less nth_Cons_0 nth_Cons_pos) + next + case False + then show ?thesis using rmge2_big jak by simp + qed + ultimately show ?thesis by simp + qed + then show "\f. f \ V_constotal \ \i. \ i = f \ (\\<^sup>\n. rmge2 (f \ n) \= i)" + and "\f n. f \ V_constotal \ \k\n. \ (the (rmge2 (f \ n))) k = f k" + by simp_all +qed + + +subsubsection \The class is not in TOTAL\ + +text \Recall that $V$ is the union of $V_1 = \{jp \mid j\geq2 \land p \in +\mathcal{R}_{01} \land \varphi_j = jp\}$ and $V_2 = \{jak0^\infty \mid j\geq 2 \land a +\in \{0, 1\}^* \land k\geq 2 \land \varphi_j = ja\uparrow^\infty \land\ +\varphi_k = jak0^\infty\}$.\ + +text \The proof is adapted from a proof of a stronger result by +Freivalds, Kinber, and Wiehagen~\cite[Theorem~27]{fkw-iisde-95} concerning an +inference type not defined here. + +The proof is by contradiction. If $V$ was in TOTAL, there would be +a strategy $S$ learning $V$ in our standard Gödel numbering $\varphi$. +By Lemma R for TOTAL we can assume $S$ to be total. + +In order to construct a function $f\in V$ for which $S$ fails we employ a +computable process iteratively building function prefixes. For every $j$ the +process builds a function $\psi_j$. The initial prefix is the singleton +$[j]$. Given a prefix $b$, the next prefix is determined as follows: +\begin{enumerate} +\item Search for a $y \geq |b|$ with $\varphi_{S(b)}(y) \downarrow= v$ for +some $v$. +\item Set the new prefix $b0^{y - |b|}\bar{v}$, where $\bar v = 1 - v$. +\end{enumerate} + +Step~1 can diverge, for example, if $\varphi_{S(b)}$ is the empty function. +In this case $\psi_j$ will only be defined for a finite prefix. If, however, +Step~2 is reached, the prefix $b$ is extended to a $b'$ such that +$\varphi_{S(b)}(y) \neq b'_y$, which implies $S(b)$ is a wrong hypothesis for +every function starting with $b'$, in particular for $\psi_j$. Since $\bar v +\in \{0, 1\}$, Step~2 only appends zeros and ones, which is important for +showing membership in $V$. + +This process defines a numbering $\psi \in \mathcal{P}^2$, and by Kleene's +fixed-point theorem there is a $j \geq 2$ with $\varphi_j = \psi_j$. 
For this +$j$ there are two cases: +\begin{enumerate} +\item[Case 1.] Step~1 always succeeds. Then $\psi_j$ is total and + $\psi_j \in V_1$. But $S$ outputs wrong hypotheses on infinitely many + prefixes of $\psi_j$ (namely every prefix constructed by the process). + +\item[Case 2.] Step~1 diverges at some iteration, say when the state is $b = ja$ + for some $a \in \{0, 1\}^*$. + Then $\psi_j$ has the form $ja\uparrow^\infty$. The numbering $\chi$ with $\chi_k = + jak0^\infty$ is in $\mathcal{P}^2$, and by Kleene's fixed-point theorem there is a + $k\geq 2$ with $\varphi_k = \chi_k = jak0^\infty$. This $jak0^\infty$ is in + $V_2$ and has the prefix $ja$. But Step~1 diverged on this prefix, which + means there is no $y \geq |ja|$ with $\varphi_{S(ja)}(y)\downarrow$. In + other words $S$ hypothesizes a non-total function. +\end{enumerate} + +Thus, in both cases there is a function in $V$ where $S$ does not behave like +a TOTAL strategy. This is the desired contradiction. + +The following locale formalizes this proof sketch.\ + +locale total_cons = + fixes s :: partial1 + assumes s_in_R1: "s \ \" +begin + +definition r_s :: recf where + "r_s \ SOME r_s. recfn 1 r_s \ total r_s \ s = (\x. eval r_s [x])" + +lemma rs_recfn [simp]: "recfn 1 r_s" + and rs_total [simp]: "\x. eval r_s [x] \" + and eval_rs: "\x. s x = eval r_s [x]" + using r_s_def R1_SOME[OF s_in_R1, of r_s] by simp_all + +text \Performing Step~1 means enumerating the domain of +$\varphi_{S(b)}$ until a $y \geq |b|$ is found. The next function enumerates +all domain values and checks the condition for them.\ + +definition "r_search_enum \ + Cn 2 r_le [Cn 2 r_length [Id 2 1], Cn 2 r_enumdom [Cn 2 r_s [Id 2 1], Id 2 0]]" + +lemma r_search_enum_recfn [simp]: "recfn 2 r_search_enum" + by (simp add: r_search_enum_def Let_def) + +abbreviation search_enum :: partial2 where + "search_enum x b \ eval r_search_enum [x, b]" + +abbreviation enumdom :: partial2 where + "enumdom i y \ eval r_enumdom [i, y]" + +lemma enumdom_empty_domain: + assumes "\x. \ i x \" + shows "\y. enumdom i y \" + using assms r_enumdom_empty_domain by (simp add: phi_def) + +lemma enumdom_nonempty_domain: + assumes "\ i x\<^sub>0 \" + shows "\y. enumdom i y \" + and "\x. \ i x \ \ (\y. enumdom i y \= x)" + using assms r_enumdom_nonempty_domain phi_def by metis+ + +text \Enumerating the empty domain yields the empty function.\ + +lemma search_enum_empty: + fixes b :: nat + assumes "s b \= i" and "\x. \ i x \" + shows "\x. search_enum x b \" + using assms r_search_enum_def enumdom_empty_domain eval_rs by simp + +text \Enumerating a non-empty domain yields a total function.\ + +lemma search_enum_nonempty: + fixes b y0 :: nat + assumes "s b \= i" and "\ i y\<^sub>0 \" and "e = the (enumdom i x)" + shows "search_enum x b \= (if e_length b \ e then 0 else 1)" +proof - + let ?e = "\x. the (enumdom i x)" + let ?y = "Cn 2 r_enumdom [Cn 2 r_s [Id 2 1], Id 2 0]" + have "recfn 2 ?y" using assms(1) by simp + moreover have "\x. eval ?y [x, b] = enumdom i x" + using assms(1,2) eval_rs by auto + moreover from this have "\x. 
eval ?y [x, b] \" + using enumdom_nonempty_domain(1)[OF assms(2)] by simp + ultimately have "eval (Cn 2 r_le [Cn 2 r_length [Id 2 1], ?y]) [x, b] \= + (if e_length b \ ?e x then 0 else 1)" + by simp + then show ?thesis using assms by (simp add: r_search_enum_def) +qed + +text \If there is a $y$ as desired, the enumeration will eventually return +zero (representing ``true'').\ + +lemma search_enum_nonempty_eq0: + fixes b y :: nat + assumes "s b \= i" and "\ i y \" and "y \ e_length b" + shows "\x. search_enum x b \= 0" +proof - + obtain x where x: "enumdom i x \= y" + using enumdom_nonempty_domain(2)[OF assms(2)] assms(2) by auto + from assms(2) have "\ i y \" by simp + with x have "search_enum x b \= 0" + using search_enum_nonempty[where ?e=y] assms by auto + then show ?thesis by auto +qed + +text \If there is no $y$ as desired, the enumeration will never return +zero.\ + +lemma search_enum_nonempty_neq0: + fixes b y0 :: nat + assumes "s b \= i" + and "\ i y\<^sub>0 \" + and "\ (\y. \ i y \ \ y \ e_length b)" + shows "\ (\x. search_enum x b \= 0)" +proof + assume "\x. search_enum x b \= 0" + then obtain x where x: "search_enum x b \= 0" + by auto + obtain y where y: "enumdom i x \= y" + using enumdom_nonempty_domain[OF assms(2)] by blast + then have "search_enum x b \= (if e_length b \ y then 0 else 1)" + using assms(1-2) search_enum_nonempty by simp + with x have "e_length b \ y" + using option.inject by fastforce + moreover have "\ i y \" + using assms(2) enumdom_nonempty_domain(2) y by blast + ultimately show False using assms(3) by force +qed + +text \The next function corresponds to Step~1. Given a prefix $b$ it +computes a $y \geq |b|$ with $\varphi_{S(b)}(y)\downarrow$ if such a $y$ +exists; otherwise it diverges.\ + +definition "r_search \ Cn 1 r_enumdom [r_s, Mn 1 r_search_enum]" + +lemma r_search_recfn [simp]: "recfn 1 r_search" + using r_search_def by simp + +abbreviation search :: partial1 where + "search b \ eval r_search [b]" + +text \If $\varphi_{S(b)}$ is the empty function, the search process +diverges because already the enumeration of the domain diverges.\ + +lemma search_empty: + assumes "s b \= i" and "\x. \ i x \" + shows "search b \" +proof - + have "\x. search_enum x b \" + using search_enum_empty[OF assms] by simp + then have "eval (Mn 1 r_search_enum) [b] \" by simp + then show "search b \" unfolding r_search_def by simp +qed + +text \If $\varphi_{S(b)}$ is non-empty, but there is no $y$ with the +desired properties, the search process diverges.\ + +lemma search_nonempty_neq0: + fixes b y0 :: nat + assumes "s b \= i" + and "\ i y\<^sub>0 \" + and "\ (\y. \ i y \ \ y \ e_length b)" + shows "search b \" +proof - + have "\ (\x. search_enum x b \= 0)" + using assms search_enum_nonempty_neq0 by simp + moreover have "recfn 1 (Mn 1 r_search_enum)" + by (simp add: assms(1)) + ultimately have "eval (Mn 1 r_search_enum) [b] \" by simp + then show ?thesis using r_search_def by auto +qed + +text \If there is a $y$ as desired, the search process will return +one such $y$.\ + +lemma search_nonempty_eq0: + fixes b y :: nat + assumes "s b \= i" and "\ i y \" and "y \ e_length b" + shows "search b \" + and "\ i (the (search b)) \" + and "the (search b) \ e_length b" +proof - + have "\x. search_enum x b \= 0" + using assms search_enum_nonempty_eq0 by simp + moreover have "\x. 
search_enum x b \" + using assms search_enum_nonempty by simp + moreover have "recfn 1 (Mn 1 r_search_enum)" + by simp + ultimately have + 1: "search_enum (the (eval (Mn 1 r_search_enum) [b])) b \= 0" and + 2: "eval (Mn 1 r_search_enum) [b] \" + using eval_Mn_diverg eval_Mn_convergE[of 1 "r_search_enum" "[b]"] + by (metis (no_types, lifting) One_nat_def length_Cons list.size(3) option.collapse, + metis (no_types, lifting) One_nat_def length_Cons list.size(3)) + let ?x = "the (eval (Mn 1 r_search_enum) [b])" + have "search b = eval (Cn 1 r_enumdom [r_s, Mn 1 r_search_enum]) [b]" + unfolding r_search_def by simp + then have 3: "search b = enumdom i ?x" + using assms 2 eval_rs by simp + then have "the (search b) = the (enumdom i ?x)" (is "?y = _") + by simp + then have 4: "search_enum ?x b \= (if e_length b \ ?y then 0 else 1)" + using search_enum_nonempty assms by simp + from 3 have "\ i ?y \" + using enumdom_nonempty_domain assms(2) by (metis option.collapse) + then show "\ i ?y \" + using phi_def by simp + then show "?y \ e_length b" + using assms 4 1 option.inject by fastforce + show "search b \" + using 3 assms(2) enumdom_nonempty_domain(1) by auto +qed + +text \The converse of the previous lemma states that whenever +the search process returns a value it will be one with the +desired properties.\ + +lemma search_converg: + assumes "s b \= i" and "search b \" (is "?y \") + shows "\ i (the ?y) \" + and "the ?y \ e_length b" +proof - + have "\y. \ i y \" + using assms search_empty by meson + then have "\y. y \ e_length b \ \ i y \" + using search_nonempty_neq0 assms by meson + then obtain y where y: "y \ e_length b \ \ i y \" by auto + then have "\ i y \" + using phi_def by simp + then show "\ i (the (search b)) \" + and "(the (search b)) \ e_length b" + using y assms search_nonempty_eq0[OF assms(1) `\ i y \`] by simp_all +qed + +text \Likewise, if the search diverges, there is no appropriate $y$.\ + +lemma search_diverg: + assumes "s b \= i" and "search b \" + shows "\ (\y. \ i y \ \ y \ e_length b)" +proof + assume "\y. \ i y \ \ y \ e_length b" + then obtain y where y: "\ i y \" "y \ e_length b" + by auto + from y(1) have "\ i y \" + by (simp add: phi_def) + with y(2) search_nonempty_eq0 have "search b \" + using assms by blast + with assms(2) show False by simp +qed + +text \Step~2 extends the prefix by a block of the shape $0^n\bar v$. +The next function constructs such a block for given $n$ and $v$.\ + +definition "r_badblock \ + let f = Cn 1 r_singleton_encode [r_not]; + g = Cn 3 r_cons [r_constn 2 0, Id 3 1] + in Pr 1 f g" + +lemma r_badblock_prim [simp]: "recfn 2 r_badblock" + unfolding r_badblock_def by simp + +lemma r_badblock: "eval r_badblock [n, v] \= list_encode (replicate n 0 @ [1 - v])" +proof (induction n) + case 0 + let ?f = "Cn 1 r_singleton_encode [r_not]" + have "eval r_badblock [0, v] = eval ?f [v]" + unfolding r_badblock_def by simp + also have "... = eval r_singleton_encode [the (eval r_not [v])]" + by simp + also have "... \= list_encode [1 - v]" + by simp + finally show ?case by simp +next + case (Suc n) + let ?g = "Cn 3 r_cons [r_constn 2 0, Id 3 1]" + have "recfn 3 ?g" by simp + have "eval r_badblock [(Suc n), v] = eval ?g [n, the (eval r_badblock [n , v]), v]" + using `recfn 3 ?g` Suc by (simp add: r_badblock_def) + also have "... = eval ?g [n, list_encode (replicate n 0 @ [1 - v]), v]" + using Suc by simp + also have "... = eval r_cons [0, list_encode (replicate n 0 @ [1 - v])]" + by simp + also have "... 
\= e_cons 0 (list_encode (replicate n 0 @ [1 - v]))" + by simp + also have "... \= list_encode (0 # (replicate n 0 @ [1 - v]))" + by simp + also have "... \= list_encode (replicate (Suc n) 0 @ [1 - v])" + by simp + finally show ?case by simp +qed + +lemma r_badblock_only_01: "e_nth (the (eval r_badblock [n, v])) i \ 1" + using r_badblock by (simp add: nth_append) + +lemma r_badblock_last: "e_nth (the (eval r_badblock [n, v])) n = 1 - v" + using r_badblock by (simp add: nth_append) + +text \The following function computes the next prefix from the current +one. In other words, it performs Steps~1 and~2.\ + +definition "r_next \ + Cn 1 r_append + [Id 1 0, + Cn 1 r_badblock + [Cn 1 r_sub [r_search, r_length], + Cn 1 r_phi [r_s, r_search]]]" + +lemma r_next_recfn [simp]: "recfn 1 r_next" + unfolding r_next_def by simp + +text \The name @{text next} is unavailable, so we go for @{term nxt}.\ + +abbreviation nxt :: partial1 where + "nxt b \ eval r_next [b]" + +lemma nxt_diverg: + assumes "search b \" + shows "nxt b \" + unfolding r_next_def using assms by (simp add: Let_def) + +lemma nxt_converg: + assumes "search b \= y" + shows "nxt b \= + e_append b (list_encode (replicate (y - e_length b) 0 @ [1 - the (\ (the (s b)) y)]))" + unfolding r_next_def using assms r_badblock search_converg phi_def eval_rs + by fastforce + +lemma nxt_search_diverg: + assumes "nxt b \" + shows "search b \" +proof (rule ccontr) + assume "search b \" + then obtain y where "search b \= y" by auto + then show False + using nxt_converg assms by simp +qed + +text \If Step~1 finds a $y$, the hypothesis $S(b)$ is incorrect for +the new prefix.\ + +lemma nxt_wrong_hyp: + assumes "nxt b \= b'" and "s b \= i" + shows "\y i y \\ e_nth b' y" +proof - + obtain y where y: "search b \= y" + using assms nxt_diverg by fastforce + then have y_len: "y \ e_length b" + using assms search_converg(2) by fastforce + then have b': "b' = + (e_append b (list_encode (replicate (y - e_length b) 0 @ [1 - the (\ i y)])))" + using y assms nxt_converg by simp + then have "e_nth b' y = 1 - the (\ i y)" + using y_len e_nth_append_big r_badblock r_badblock_last by auto + moreover have "\ i y \" + using search_converg y y_len assms(2) by fastforce + ultimately have "\ i y \\ e_nth b' y" + by (metis gr_zeroI less_numeral_extra(4) less_one option.sel zero_less_diff) + moreover have "e_length b' = Suc y" + using y_len e_length_append b' by auto + ultimately show ?thesis by auto +qed + +text \If Step~1 diverges, the hypothesis $S(b)$ refers to a non-total +function.\ + +lemma nxt_nontotal_hyp: + assumes "nxt b \" and "s b \= i" + shows "\x. \ i x \" + using nxt_search_diverg[OF assms(1)] search_diverg[OF assms(2)] by auto + +text \The process only ever extends the given prefix.\ + +lemma nxt_stable: + assumes "nxt b \= b'" + shows "\x= y" + using assms nxt_diverg by fastforce + then have "y \ e_length b" + using search_converg(2) eval_rs rs_total by fastforce + show ?thesis + proof (rule allI, rule impI) + fix x assume "x < e_length b" + let ?i = "the (s b)" + have b': "b' = + (e_append b (list_encode (replicate (y - e_length b) 0 @ [1 - the (\ ?i y)])))" + using assms nxt_converg[OF y] by auto + then show "e_nth b x = e_nth b' x" + using e_nth_append_small \x < e_length b\ by auto + qed +qed + +text \The following properties of @{term r_next} will be +used to show that some of the constructed functions are in the class +$V$.\ + +lemma nxt_append_01: + assumes "nxt b \= b'" + shows "\x. 
x \ e_length b \ x < e_length b' \ e_nth b' x = 0 \ e_nth b' x = 1" +proof - + obtain y where y: "search b \= y" + using assms nxt_diverg by fastforce + let ?i = "the (s b)" + have b': "b' = (e_append b (list_encode (replicate (y - e_length b) 0 @ [1 - the (\ ?i y)])))" + (is "b' = (e_append b ?z)") + using assms y nxt_converg prod_encode_eq by auto + show ?thesis + proof (rule allI, rule impI) + fix x assume x: "e_length b \ x \ x < e_length b'" + then have "e_nth b' x = e_nth ?z (x - e_length b)" + using b' e_nth_append_big by blast + then show "e_nth b' x = 0 \ e_nth b' x = 1" + by (metis less_one nat_less_le option.sel r_badblock r_badblock_only_01) + qed +qed + +lemma nxt_monotone: + assumes "nxt b \= b'" + shows "e_length b < e_length b'" +proof - + obtain y where y: "search b \= y" + using assms nxt_diverg by fastforce + let ?i = "the (s b)" + have b': "b' = + (e_append b (list_encode (replicate (y - e_length b) 0 @ [1 - the (\ ?i y)])))" + using assms y nxt_converg prod_encode_eq by auto + then show ?thesis using e_length_append by auto +qed + +text \The next function computes the prefixes after each iteration of +the process @{term r_next} when started with the list $[j]$.\ + +definition r_prefixes :: recf where + "r_prefixes \ Pr 1 r_singleton_encode (Cn 3 r_next [Id 3 1])" + +lemma r_prefixes_recfn [simp]: "recfn 2 r_prefixes" + unfolding r_prefixes_def by (simp add: Let_def) + +abbreviation prefixes :: partial2 where + "prefixes t j \ eval r_prefixes [t, j]" + +lemma prefixes_at_0: "prefixes 0 j \= list_encode [j]" + unfolding r_prefixes_def by simp + +lemma prefixes_at_Suc: + assumes "prefixes t j \" (is "?b \") + shows "prefixes (Suc t) j = nxt (the ?b)" + using r_prefixes_def assms by auto + +lemma prefixes_at_Suc': + assumes "prefixes t j \= b" + shows "prefixes (Suc t) j = nxt b" + using r_prefixes_def assms by auto + +lemma prefixes_prod_encode: + assumes "prefixes t j \" + obtains b where "prefixes t j \= b" + using assms surj_prod_encode by force + +lemma prefixes_converg_le: + assumes "prefixes t j \" and "t' \ t" + shows "prefixes t' j \" + using r_prefixes_def assms eval_Pr_converg_le[of 1 _ _ "[j]"] + by simp + +lemma prefixes_diverg_add: + assumes "prefixes t j \" + shows "prefixes (t + d) j \" + using r_prefixes_def assms eval_Pr_diverg_add[of 1 _ _ "[j]"] + by simp + +text \Many properties of @{term r_prefixes} can be derived from similar +properties of @{term r_next}.\ + +lemma prefixes_length: + assumes "prefixes t j \= b" + shows "e_length b > t" +proof (insert assms, induction t arbitrary: b) + case 0 + then show ?case using prefixes_at_0 prod_encode_eq by auto +next + case (Suc t) + then have "prefixes t j \" + using prefixes_converg_le Suc_n_not_le_n nat_le_linear by blast + then obtain b' where b': "prefixes t j \= b'" + using prefixes_prod_encode by blast + with Suc have "e_length b' > t" by simp + have "prefixes (Suc t) j = nxt b'" + using b' prefixes_at_Suc' by simp + with Suc have "nxt b' \= b" by simp + then have "e_length b' < e_length b" + using nxt_monotone by simp + then show ?case using `e_length b' > t` by simp +qed + +lemma prefixes_monotone: + assumes "prefixes t j \= b" and "prefixes (t + d) j \= b'" + shows "e_length b \ e_length b'" +proof (insert assms, induction d arbitrary: b') + case 0 + then show ?case using prod_encode_eq by simp +next + case (Suc d) + moreover have "t + d \ t + Suc d" by simp + ultimately have "prefixes (t + d) j \" + using prefixes_converg_le by blast + then obtain b'' where b'': "prefixes (t + d) j \= b''" + using 
prefixes_prod_encode by blast + with Suc have "prefixes (t + Suc d) j = nxt b''" + by (simp add: prefixes_at_Suc') + with Suc have "nxt b'' \= b'" by simp + then show ?case using nxt_monotone Suc b'' by fastforce +qed + +lemma prefixes_stable: + assumes "prefixes t j \= b" and "prefixes (t + d) j \= b'" + shows "\x t + Suc d" by simp + ultimately have "prefixes (t + d) j \" + using prefixes_converg_le by blast + then obtain b'' where b'': "prefixes (t + d) j \= b''" + using prefixes_prod_encode by blast + with Suc have "prefixes (t + Suc d) j = nxt b''" + by (simp add: prefixes_at_Suc') + with Suc have b': "nxt b'' \= b'" by simp + show "\x e_length b''" + using x prefixes_monotone b'' Suc by fastforce + ultimately show "e_nth b x = e_nth b' x" + using b'' nxt_stable Suc b' prefixes_monotone x + by (metis leD le_neq_implies_less) + qed +qed + +lemma prefixes_tl_only_01: + assumes "prefixes t j \= b" + shows "\x>0. e_nth b x = 0 \ e_nth b x = 1" +proof (insert assms, induction t arbitrary: b) + case 0 + then show ?case using prefixes_at_0 prod_encode_eq by auto +next + case (Suc t) + then have "prefixes t j \" + using prefixes_converg_le Suc_n_not_le_n nat_le_linear by blast + then obtain b' where b': "prefixes t j \= b'" + using prefixes_prod_encode by blast + show "\x>0. e_nth b x = 0 \ e_nth b x = 1" + proof (rule allI, rule impI) + fix x :: nat + assume x: "x > 0" + show "e_nth b x = 0 \ e_nth b x = 1" + proof (cases "x < e_length b'") + case True + then show ?thesis + using Suc b' prefixes_at_Suc' nxt_stable x by metis + next + case False + then show ?thesis + using Suc.prems b' prefixes_at_Suc' nxt_append_01 by auto + qed + qed +qed + +lemma prefixes_hd: + assumes "prefixes t j \= b" + shows "e_nth b 0 = j" +proof - + obtain b' where b': "prefixes 0 j \= b'" + by (simp add: prefixes_at_0) + then have "b' = list_encode [j]" + by (simp add: prod_encode_eq prefixes_at_0) + then have "e_nth b' 0 = j" by simp + then show "e_nth b 0 = j" + using assms prefixes_stable[OF b', of t b] prefixes_length[OF b'] by simp +qed + +lemma prefixes_nontotal_hyp: + assumes "prefixes t j \= b" + and "prefixes (Suc t) j \" + and "s b \= i" + shows "\x. \ i x \" + using nxt_nontotal_hyp[OF _ assms(3)] assms(2) prefixes_at_Suc'[OF assms(1)] by simp + +text \We now consider the two cases from the proof sketch.\ + +abbreviation "case_two j \ \t. prefixes t j \" + +abbreviation "case_one j \ \ case_two j" + +text \In Case~2 there is a maximum convergent iteration because +iteration 0 converges.\ + +lemma case_two: + assumes "case_two j" + shows "\t. (\t'\t. prefixes t' j \) \ (\t'>t. prefixes t' j \)" +proof - + let ?P = "\t. prefixes t j \" + define t\<^sub>0 where "t\<^sub>0 = Least ?P" + then have "?P t\<^sub>0" + using assms LeastI_ex[of ?P] by simp + then have diverg: "?P t" if "t \ t\<^sub>0" for t + using prefixes_converg_le that by blast + from t\<^sub>0_def have converg: "\ ?P t" if "t < t\<^sub>0" for t + using Least_le[of ?P] that not_less by blast + have "t\<^sub>0 > 0" + proof (rule ccontr) + assume "\ 0 < t\<^sub>0" + then have "t\<^sub>0 = 0" by simp + with `?P t\<^sub>0` prefixes_at_0 show False by simp + qed + let ?t = "t\<^sub>0 - 1" + have "\t'\?t. prefixes t' j \" + using converg \0 < t\<^sub>0\ by auto + moreover have "\t'>?t. prefixes t' j \" + using diverg by simp + ultimately show ?thesis by auto +qed + +text \Having completed the modelling of the process, we can now define +the functions $\psi_j$ it computes. 
The value $\psi_j(x)$ is computed by +running @{term r_prefixes} until the prefix is longer than $x$ and then +taking the $x$-th element of the prefix.\ + +definition "r_psi \ + let f = Cn 3 r_less [Id 3 2, Cn 3 r_length [Cn 3 r_prefixes [Id 3 0, Id 3 1]]] + in Cn 2 r_nth [Cn 2 r_prefixes [Mn 2 f, Id 2 0], Id 2 1]" + +lemma r_psi_recfn: "recfn 2 r_psi" + unfolding r_psi_def by simp + +abbreviation psi :: partial2 ("\") where + "\ j x \ eval r_psi [j, x]" + +lemma psi_in_P2: "\ \ \

\<^sup>2" + using r_psi_recfn by auto + +text \The values of @{term "\"} can be read off the prefixes.\ + +lemma psi_eq_nth_prefix: + assumes "prefixes t j \= b" and "e_length b > x" + shows "\ j x \= e_nth b x" +proof - + let ?f = "Cn 3 r_less [Id 3 2, Cn 3 r_length [Cn 3 r_prefixes [Id 3 0, Id 3 1]]]" + let ?P = "\t. prefixes t j \ \ e_length (the (prefixes t j)) > x" + from assms have ex_t: "\t. ?P t" by auto + define t\<^sub>0 where "t\<^sub>0 = Least ?P" + then have "?P t\<^sub>0" + using LeastI_ex[OF ex_t] by simp + from ex_t have not_P: "\ ?P t" if "t < t\<^sub>0" for t + using ex_t that Least_le[of ?P] not_le t\<^sub>0_def by auto + + have "?P t" using assms by simp + with not_P have "t\<^sub>0 \ t" using leI by blast + then obtain b\<^sub>0 where b0: "prefixes t\<^sub>0 j \= b\<^sub>0" + using assms(1) prefixes_converg_le by blast + + have "eval ?f [t\<^sub>0, j, x] \= 0" + proof - + have "eval (Cn 3 r_prefixes [Id 3 0, Id 3 1]) [t\<^sub>0, j, x] \= b\<^sub>0" + using b0 by simp + then show ?thesis using `?P t\<^sub>0` by simp + qed + moreover have "eval ?f [t, j, x] \\ 0" if "t < t\<^sub>0" for t + proof - + obtain bt where bt: "prefixes t j \= bt" + using prefixes_converg_le[of t\<^sub>0 j t] b0 `t < t\<^sub>0` by auto + moreover have "\ ?P t" + using that not_P by simp + ultimately have "e_length bt \ x" by simp + moreover have "eval (Cn 3 r_prefixes [Id 3 0, Id 3 1]) [t, j, x] \= bt" + using bt by simp + ultimately show ?thesis by simp + qed + ultimately have "eval (Mn 2 ?f) [j, x] \= t\<^sub>0" + using eval_Mn_convergI[of 2 ?f "[j, x]" t\<^sub>0] by simp + then have "\ j x \= e_nth b\<^sub>0 x" + unfolding r_psi_def using b0 by simp + then show ?thesis + using `t\<^sub>0 \ t` assms(1) prefixes_stable[of t\<^sub>0 j b\<^sub>0 "t - t\<^sub>0" b] b0 `?P t\<^sub>0` + by simp +qed + +lemma psi_converg_imp_prefix: + assumes "\ j x \" + shows "\t b. prefixes t j \= b \ e_length b > x" +proof - + let ?f = "Cn 3 r_less [Id 3 2, Cn 3 r_length [Cn 3 r_prefixes [Id 3 0, Id 3 1]]]" + have "eval (Mn 2 ?f) [j, x] \" + proof (rule ccontr) + assume "\ eval (Mn 2 ?f) [j, x] \" + then have "eval (Mn 2 ?f) [j, x] \" by simp + then have "\ j x \" + unfolding r_psi_def by simp + then show False + using assms by simp + qed + then obtain t where t: "eval (Mn 2 ?f) [j, x] \= t" + by blast + have "recfn 2 (Mn 2 ?f)" by simp + then have f_zero: "eval ?f [t, j, x] \= 0" + using eval_Mn_convergE[OF _ t] + by (metis (no_types, lifting) One_nat_def Suc_1 length_Cons list.size(3)) + have "prefixes t j \" + proof (rule ccontr) + assume "\ prefixes t j \" + then have "prefixes t j \" by simp + then have "eval ?f [t, j, x] \" by simp + with f_zero show False by simp + qed + then obtain b' where b': "prefixes t j \= b'" by auto + moreover have "e_length b' > x" + proof (rule ccontr) + assume "\ e_length b' > x" + then have "eval ?f [t, j, x] \= 1" + using b' by simp + with f_zero show False by simp + qed + ultimately show ?thesis by auto +qed + +lemma psi_converg_imp_prefix': + assumes "\ j x \" + shows "\t b. 
prefixes t j \= b \ e_length b > x \ \ j x \= e_nth b x" + using psi_converg_imp_prefix[OF assms] psi_eq_nth_prefix by blast + +text \In both Case~1 and~2, $\psi_j$ starts with $j$.\ + +lemma psi_at_0: "\ j 0 \= j" + using prefixes_hd prefixes_length psi_eq_nth_prefix prefixes_at_0 by fastforce + +text \In Case~1, $\psi_j$ is total and made up of $j$ followed by zeros +and ones, just as required by the definition of $V_1$.\ + +lemma case_one_psi_total: + assumes "case_one j" and "x > 0" + shows "\ j x \= 0 \ \ j x \= 1" +proof - + obtain b where b: "prefixes x j \= b" + using assms(1) by auto + then have "e_length b > x" + using prefixes_length by simp + then have "\ j x \= e_nth b x" + using b psi_eq_nth_prefix by simp + moreover have "e_nth b x = 0 \ e_nth b x = 1" + using prefixes_tl_only_01[OF b] assms(2) by simp + ultimately show "\ j x \= 0 \ \ j x \= 1" + by simp +qed + +text \In Case~2, $\psi_j$ is defined only for a prefix starting with +$j$ and continuing with zeros and ones. This prefix corresponds to $ja$ from +the definition of $V_2$.\ + +lemma case_two_psi_only_prefix: + assumes "case_two j" + shows "\y. (\x. 0 < x \ x < y \ \ j x \= 0 \ \ j x \= 1) \ + (\x \ y. \ j x \)" +proof - + obtain t where + t_le: "\t'\t. prefixes t' j \" and + t_gr: "\t'>t. prefixes t' j \" + using assms case_two by blast + then obtain b where b: "prefixes t j \= b" + by auto + let ?y = "e_length b" + have "\ j x \= 0 \ \ j x \= 1" if "x > 0 \ x < ?y" for x + using t_le b that by (metis prefixes_tl_only_01 psi_eq_nth_prefix) + moreover have "\ j x \" if "x \ ?y" for x + proof (rule ccontr) + assume "\ j x \" + then obtain t' b' where t': "prefixes t' j \= b'" and "e_length b' > x" + using psi_converg_imp_prefix by blast + then have "e_length b' > ?y" + using that by simp + with t' have "t' > t" + using prefixes_monotone b by (metis add_diff_inverse_nat leD) + with t' t_gr show False by simp + qed + ultimately show ?thesis by auto +qed + +definition longest_prefix :: "nat \ nat" where + "longest_prefix j \ THE y. (\x j x \) \ (\x\y. \ j x \)" + +lemma longest_prefix: + assumes "case_two j" and "z = longest_prefix j" + shows "(\x j x \) \ (\x\z. \ j x \)" +proof - + let ?P = "\z. (\x j x \) \ (\x\z. \ j x \)" + obtain y where y: + "\x. 0 < x \ x < y \ \ j x \= 0 \ \ j x \= 1" + "\x\y. \ j x \" + using case_two_psi_only_prefix[OF assms(1)] by auto + have "?P (THE z. ?P z)" + proof (rule theI[of ?P y]) + show "?P y" + proof + show "\x j x \" + proof (rule allI, rule impI) + fix x assume "x < y" + show "\ j x \" + proof (cases "x = 0") + case True + then show ?thesis using psi_at_0 by simp + next + case False + then show ?thesis using y(1) `x < y` by auto + qed + qed + show "\x\y. \ j x \" using y(2) by simp + qed + show "z = y" if "?P z" for z + proof (rule ccontr, cases "z < y") + case True + moreover assume "z \ y" + ultimately show False + using that `?P y` by auto + next + case False + moreover assume "z \ y" + then show False + using that `?P y` y(2) by (meson linorder_cases order_refl) + qed + qed + then have "(\x<(THE z. ?P z). \ j x \) \ (\x\(THE z. ?P z). \ j x \)" + by blast + moreover have "longest_prefix j = (THE z. ?P z)" + unfolding longest_prefix_def by simp + ultimately show ?thesis using assms(2) by metis +qed + +lemma case_two_psi_longest_prefix: + assumes "case_two j" and "y = longest_prefix j" + shows "(\x. 0 < x \ x < y \ \ j x \= 0 \ \ j x \= 1) \ + (\x \ y. 
\ j x \)" + using assms longest_prefix case_two_psi_only_prefix + by (metis prefixes_tl_only_01 psi_converg_imp_prefix') + +text \The prefix cannot be empty because the process starts with prefix $[j]$.\ + +lemma longest_prefix_gr_0: + assumes "case_two j" + shows "longest_prefix j > 0" + using assms case_two_psi_longest_prefix psi_at_0 by force + +lemma psi_not_divergent_init: + assumes "prefixes t j \= b" + shows "(\ j) \ (e_length b - 1) = b" +proof (intro initI) + show "0 < e_length b" + using assms prefixes_length by fastforce + show "\ j x \= e_nth b x" if "x < e_length b" for x + using that assms psi_eq_nth_prefix by simp +qed + +text \In Case~2, the strategy $S$ outputs a non-total hypothesis on +some prefix of $\psi_j$.\ + +lemma case_two_nontotal_hyp: + assumes "case_two j" + shows "\n total1 (\ (the (s ((\ j) \ n))))" +proof - + obtain t where "\t'\t. prefixes t' j \" and t_gr: "\t'>t. prefixes t' j \" + using assms case_two by blast + then obtain b where b: "prefixes t j \= b" + by auto + moreover obtain i where i: "s b \= i" + using eval_rs by fastforce + moreover have div: "prefixes (Suc t) j \" + using t_gr by simp + ultimately have "\x. \ i x \" + using prefixes_nontotal_hyp by simp + then obtain x where "\ i x \" by auto + moreover have init: "\ j \ (e_length b - 1) = b" (is "_ \ ?n = b") + using psi_not_divergent_init[OF b] by simp + ultimately have "\ (the (s (\ j \ ?n))) x \" + using i by simp + then have "\ total1 (\ (the (s (\ j \ ?n))))" + by auto + moreover have "?n < longest_prefix j" + using case_two_psi_longest_prefix init b div psi_eq_nth_prefix + by (metis length_init lessI not_le_imp_less option.simps(3)) + ultimately show ?thesis by auto +qed + +text \Consequently, in Case~2 the strategy does not TOTAL-learn +any function starting with the longest prefix of $\psi_j$.\ + +lemma case_two_not_learn: + assumes "case_two j" + and "f \ \" + and "\x. x < longest_prefix j \ f x = \ j x" + shows "\ learn_total \ {f} s" +proof - + obtain n where n: + "n < longest_prefix j" + "\ total1 (\ (the (s (\ j \ n))))" + using case_two_nontotal_hyp[OF assms(1)] by auto + have "f \ n = \ j \ n" + using assms(3) n(1) by (intro init_eqI) auto + with n(2) show ?thesis by (metis R1_imp_total1 learn_totalE(3) singletonI) +qed + +text \In Case~1 the strategy outputs a wrong hypothesis +on infinitely many prefixes of $\psi_j$ and thus does not +learn $\psi_j$ in the limit, much less in the sense of TOTAL.\ + +lemma case_one_wrong_hyp: + assumes "case_one j" + shows "\n>k. \ (the (s ((\ j) \ n))) \ \ j" +proof - + have all_t: "\t. prefixes t j \" + using assms by simp + then obtain b where b: "prefixes (Suc k) j \= b" + by auto + then have length: "e_length b > Suc k" + using prefixes_length by simp + then have init: "\ j \ (e_length b - 1) = b" + using psi_not_divergent_init b by simp + obtain i where i: "s b \= i" + using eval_rs by fastforce + from all_t obtain b' where b': "prefixes (Suc (Suc k)) j \= b'" + by auto + then have "\ j \ (e_length b' - 1) = b'" + using psi_not_divergent_init by simp + moreover have "\y i y \\ e_nth b' y" + using nxt_wrong_hyp b b' i prefixes_at_Suc by auto + ultimately have "\y i y \ \ j y" + using b' psi_eq_nth_prefix by auto + then have "\ i \ \ j" by auto + then show ?thesis + using init length i by (metis Suc_less_eq length_init option.sel) +qed + +lemma case_one_not_learn: + assumes "case_one j" + shows "\ learn_lim \ {\ j} s" +proof (rule infinite_hyp_wrong_not_Lim[of "\ j"]) + show "\ j \ {\ j}" by simp + show "\n. \m>n. 
\ (the (s (\ j \ m))) \ \ j" + using case_one_wrong_hyp[OF assms] by simp +qed + +lemma case_one_not_learn_V: + assumes "case_one j" and "j \ 2" and "\ j = \ j" + shows "\ learn_lim \ V_constotal s" +proof - + have "\ j \ V_constotal_1" + proof - + define p where "p = (\x. (\ j) (x + 1))" + have "p \ \\<^sub>0\<^sub>1" + proof - + from p_def have "p \ \

" + using skip_P1[of "\ j" 1] psi_in_P2 P2_proj_P1 by blast + moreover have "p x \= 0 \ p x \= 1" for x + using p_def assms(1) case_one_psi_total by auto + moreover from this have "total1 p" by fast + ultimately show ?thesis using RPred1_def by auto + qed + moreover have "\ j = [j] \ p" + by (intro prepend_eqI, simp add: psi_at_0, simp add: p_def) + ultimately show ?thesis using assms(2,3) V_constotal_1_def by blast + qed + then have "\ j \ V_constotal" using V_constotal_def by auto + moreover have "\ learn_lim \ {\ j} s" + using case_one_not_learn assms(1) by simp + ultimately show ?thesis using learn_lim_closed_subseteq by auto +qed + +text \The next lemma embodies the construction of $\chi$ followed by +the application of Kleene's fixed-point theorem as described in the +proof sketch.\ + +lemma goedel_after_prefixes: + fixes vs :: "nat list" and m :: nat + shows "\n\m. \ n = vs @ [n] \ 0\<^sup>\" +proof - + define f :: partial1 where "f \ vs \ 0\<^sup>\" + then have "f \ \" + using almost0_in_R1 by auto + then obtain n where n: + "n \ m" + "\ n = (\x. if x = length vs then Some n else f x)" + using goedel_at[of f m "length vs"] by auto + moreover have "\ n x = (vs @ [n] \ 0\<^sup>\) x" for x + proof - + consider "x < length vs" | "x = length vs" | "x > length vs" + by linarith + then show ?thesis + using n f_def by (cases) (auto simp add: prepend_associative) + qed + ultimately show ?thesis by blast +qed + +text \If Case~2 holds for a $j\geq 2$ with $\varphi_j = \psi_j$, that +is, if $\psi_j\in V_1$, then there is a function in $V$, namely $\psi_j$, on +which $S$ fails. Therefore $S$ does not learn $V$.\ + +lemma case_two_not_learn_V: + assumes "case_two j" and "j \ 2" and "\ j = \ j" + shows "\ learn_total \ V_constotal s" +proof - + define z where "z = longest_prefix j" + then have "z > 0" + using longest_prefix_gr_0[OF assms(1)] by simp + define vs where "vs = prefix (\ j) (z - 1)" + then have "vs ! 0 = j" + using psi_at_0 `z > 0` by simp + define a where "a = tl vs" + then have vs: "vs = j # a" + using vs_def `vs ! 0 = j` + by (metis length_Suc_conv length_prefix list.sel(3) nth_Cons_0) + obtain k where k: "k \ 2" and phi_k: "\ k = j # a @ [k] \ 0\<^sup>\" + using goedel_after_prefixes[of 2 "j # a"] by auto + have phi_j: "\ j = j # a \ \\<^sup>\ " + proof (rule prepend_eqI) + show "\x. x < length (j # a) \ \ j x \= (j # a) ! x" + using assms(1,3) vs vs_def \0 < z\ + length_prefix[of "\ j" "z - 1"] + prefix_nth[of _ _ "\ j"] + psi_at_0[of j] + case_two_psi_longest_prefix[OF _ z_def] + longest_prefix[OF _ z_def] + by (metis One_nat_def Suc_pred option.collapse) + show "\x. \ j (length (j # a) + x) \" + using assms(3) vs_def + by (simp add: vs assms(1) case_two_psi_longest_prefix z_def) + qed + moreover have "\ k \ V_constotal_2" + proof (intro V_constotal_2I[of _ j a k]) + show "\ k = j # a @ [k] \ 0\<^sup>\" + using phi_k . + show "2 \ j" + using `2 \ j` . + show "2 \ k" + using `2 \ k` . + show "\i 1" + proof (rule allI, rule impI) + fix i assume i: "i < length a" + then have "Suc i < z" + using z_def vs_def length_prefix \0 < z\ vs + by (metis One_nat_def Suc_mono Suc_pred length_Cons) + have "a ! i = vs ! (Suc i)" + using vs by simp + also have "... = the (\ j (Suc i))" + using vs_def vs i length_Cons length_prefix prefix_nth + by (metis Suc_mono) + finally show "a ! 
i \ 1" + using case_two_psi_longest_prefix `Suc i < z` z_def + by (metis assms(1) less_or_eq_imp_le not_le_imp_less not_one_less_zero + option.sel zero_less_Suc) + qed + qed (auto simp add: phi_j) + then have "\ k \ V_constotal" + using V_constotal_def by auto + moreover have "\ learn_total \ {\ k} s" + proof - + have "\ k \ \" + by (simp add: phi_k almost0_in_R1) + moreover have "\x. x < longest_prefix j \ \ k x = \ j x" + using phi_k vs_def z_def length_prefix phi_j prepend_associative prepend_at_less + by (metis One_nat_def Suc_pred \0 < z\ \vs = j # a\ append_Cons assms(3)) + ultimately show ?thesis + using case_two_not_learn[OF assms(1)] by simp + qed + ultimately show "\ learn_total \ V_constotal s" + using learn_total_closed_subseteq by auto +qed + +text \The strategy $S$ does not learn $V$ in either case.\ + +lemma not_learn_total_V: "\ learn_total \ V_constotal s" +proof - + obtain j where "j \ 2" "\ j = \ j" + using kleene_fixed_point psi_in_P2 by auto + then show ?thesis + using case_one_not_learn_V learn_total_def case_two_not_learn_V + by (cases "case_two j") auto +qed + +end + + +lemma V_not_in_TOTAL: "V_constotal \ TOTAL" +proof (rule ccontr) + assume "\ V_constotal \ TOTAL" + then have "V_constotal \ TOTAL" by simp + then have "V_constotal \ TOTAL_wrt \" + by (simp add: TOTAL_wrt_phi_eq_TOTAL) + then obtain s where "learn_total \ V_constotal s" + using TOTAL_wrt_def by auto + then obtain s' where s': "s' \ \" "learn_total \ V_constotal s'" + using lemma_R_for_TOTAL_simple by blast + then interpret total_cons s' + by (simp add: total_cons_def) + have "\ learn_total \ V_constotal s'" + by (simp add: not_learn_total_V) + with s'(2) show False by simp +qed + +lemma TOTAL_neq_CONS: "TOTAL \ CONS" + using V_not_in_TOTAL V_in_CONS CONS_def by auto + +text \The main result of this section:\ + +theorem TOTAL_subset_CONS: "TOTAL \ CONS" + using TOTAL_subseteq_CONS TOTAL_neq_CONS by simp + +end \ No newline at end of file diff --git a/thys/Inductive_Inference/Union.thy b/thys/Inductive_Inference/Union.thy new file mode 100644 --- /dev/null +++ b/thys/Inductive_Inference/Union.thy @@ -0,0 +1,283 @@ +section \The union of classes\label{s:union}\ + +theory Union + imports R1_BC TOTAL_CONS +begin + +text \None of the inference types introduced in this chapter are closed +under union of classes. For all inference types except FIN this follows from +@{thm[source] "U0_V0_not_in_BC"}.\ + +lemma not_closed_under_union: + "\\\{CP, TOTAL, CONS, LIM, BC}. U\<^sub>0 \ \ \ V\<^sub>0 \ \ \ U\<^sub>0 \ V\<^sub>0 \ \" + using U0_in_CP U0_in_NUM V0_in_FIN + FIN_subseteq_CP + NUM_subseteq_TOTAL + CP_subseteq_TOTAL + TOTAL_subseteq_CONS + CONS_subseteq_Lim + Lim_subseteq_BC + U0_V0_not_in_BC + by blast + +text \In order to show the analogous result for FIN consider the +classes $\{0^\infty\}$ and $\{0^n10^\infty \mid n \in \mathbb{N}\}$. The +former can be learned finitely by a strategy that hypothesizes $0^\infty$ for +every input. The latter can be learned finitely by a strategy that waits for +the 1 and hypothesizes the only function in the class with a 1 at that +position. However, the union of both classes is not in FIN. This is because +any FIN strategy has to hypothesize $0^\infty$ on some prefix of the form +$0^n$. But the strategy then fails for the function $0^n10^\infty$.\ + +lemma singleton_in_FIN: "f \ \ \ {f} \ FIN" +proof - + assume "f \ \" + then obtain i where i: "\ i = f" + using phi_universal by blast + define s :: partial1 where "s = (\_. 
Some (Suc i))" + then have "s \ \" + using const_in_Prim1[of "Suc i"] by simp + have "learn_fin \ {f} s" + proof (intro learn_finI) + show "environment \ {f} s" + using `s \ \` `f \ \` by (simp add: phi_in_P2) + show "\i n\<^sub>0. \ i = g \ (\n0. s (g \ n) \= 0) \ (\n\n\<^sub>0. s (g \ n) \= Suc i)" + if "g \ {f}" for g + proof - + from that have "g = f" by simp + then have "\ i = g" + using i by simp + moreover have "\n<0. s (g \ n) \= 0" by simp + moreover have "\n\0. s (g \ n) \= Suc i" + using s_def by simp + ultimately show ?thesis by auto + qed + qed + then show "{f} \ FIN" using FIN_def by auto +qed + +definition U_single :: "partial1 set" where + "U_single \ {(\x. if x = n then Some 1 else Some 0)| n. n \ UNIV}" + +lemma U_single_in_FIN: "U_single \ FIN" +proof - + define psi :: partial2 where "psi \ \n x. if x = n then Some 1 else Some 0" + have "psi \ \\<^sup>2" + using psi_def by (intro R2I[of "Cn 2 r_not [r_eq]"]) auto + define s :: partial1 where + "s \ \b. if findr b \= e_length b then Some 0 else Some (Suc (the (findr b)))" + have "s \ \" + proof (rule R1I) + let ?r = "Cn 1 r_ifeq [r_findr, r_length, Z, Cn 1 S [r_findr]]" + show "recfn 1 ?r" by simp + show "total ?r" by auto + show "eval ?r [b] = s b" for b + proof - + let ?b = "the (findr b)" + have "eval ?r [b] = (if ?b = e_length b then Some 0 else Some (Suc (?b)))" + using findr_total by simp + then show "eval ?r [b] = s b" + by (metis findr_total option.collapse option.inject s_def) + qed + qed + have "U_single \ \" + proof + fix f + assume "f \ U_single" + then obtain n where "f = (\x. if x = n then Some 1 else Some 0)" + using U_single_def by auto + then have "f = psi n" + using psi_def by simp + then show "f \ \" + using `psi \ \\<^sup>2` by simp + qed + have "learn_fin psi U_single s" + proof (rule learn_finI) + show "environment psi U_single s" + using `psi \ \\<^sup>2` `s \ \` `U_single \ \` by simp + show "\i n\<^sub>0. psi i = f \ (\n0. s (f \ n) \= 0) \ (\n\n\<^sub>0. s (f \ n) \= Suc i)" + if "f \ U_single" for f + proof - + from that obtain i where i: "f = (\x. if x = i then Some 1 else Some 0)" + using U_single_def by auto + then have "psi i = f" + using psi_def by simp + moreover have "\n n) \= 0" + using i s_def findr_def by simp + moreover have "\n\i. s (f \ n) \= Suc i" + proof (rule allI, rule impI) + fix n + assume "n \ i" + let ?e = "init f n" + have "\i 0" + using `n \ i` i by simp + then have less: "the (findr ?e) < e_length ?e" + and nth_e: "e_nth ?e (the (findr ?e)) \ 0" + using findr_ex by blast+ + then have "s ?e \= Suc (the (findr ?e))" + using s_def by auto + moreover have "the (findr ?e) = i" + using nth_e less i by (metis length_init nth_init option.sel) + ultimately show "s ?e \= Suc i" by simp + qed + ultimately show ?thesis by auto + qed + qed + then show "U_single \ FIN" using FIN_def by blast +qed + +lemma zero_U_single_not_in_FIN: "{0\<^sup>\} \ U_single \ FIN" +proof + assume "{0\<^sup>\} \ U_single \ FIN" + then obtain psi s where learn: "learn_fin psi ({0\<^sup>\} \ U_single) s" + using FIN_def by blast + then have "learn_fin psi {0\<^sup>\} s" + using learn_fin_closed_subseteq by auto + then obtain i n\<^sub>0 where i: + "psi i = 0\<^sup>\" + "\n0. s (0\<^sup>\ \ n) \= 0" + "\n\n\<^sub>0. s (0\<^sup>\ \ n) \= Suc i" + using learn_finE(2) by blast + let ?f = "\x. 
if x = Suc n\<^sub>0 then Some 1 else Some 0" + have "?f \ 0\<^sup>\" by (metis option.inject zero_neq_one) + have "?f \ U_single" + using U_single_def by auto + then have "learn_fin psi {?f} s" + using learn learn_fin_closed_subseteq by simp + then obtain j m\<^sub>0 where j: + "psi j = ?f" + "\n0. s (?f \ n) \= 0" + "\n\m\<^sub>0. s (?f \ n) \= Suc j" + using learn_finE(2) by blast + consider + (less) "m\<^sub>0 < n\<^sub>0" | (eq) "m\<^sub>0 = n\<^sub>0" | (gr) "m\<^sub>0 > n\<^sub>0" + by linarith + then show False + proof (cases) + case less + then have "s (0\<^sup>\\ m\<^sub>0) \= 0" + using i by simp + moreover have "0\<^sup>\ \ m\<^sub>0 = ?f \ m\<^sub>0" + using less init_eqI[of m\<^sub>0 ?f "0\<^sup>\"] by simp + ultimately have "s (?f \ m\<^sub>0) \= 0" by simp + then show False using j by simp + next + case eq + then have "0\<^sup>\ \ m\<^sub>0 = ?f \ m\<^sub>0" + using init_eqI[of m\<^sub>0 ?f "0\<^sup>\"] by simp + then have "s (0\<^sup>\ \ m\<^sub>0) = s (?f \ m\<^sub>0)" by simp + then have "i = j" + using i j eq by simp + then have "psi i = psi j" by simp + then show False using `?f \ 0\<^sup>\` i j by simp + next + case gr + have "0\<^sup>\ \ n\<^sub>0 = ?f \ n\<^sub>0" + using init_eqI[of n\<^sub>0 ?f "0\<^sup>\"] by simp + moreover have "s (0\<^sup>\ \ n\<^sub>0) \= Suc i" + using i by simp + moreover have "s (?f \ n\<^sub>0) \= 0" + using j gr by simp + ultimately show False by simp + qed +qed + +lemma FIN_not_closed_under_union: "\U V. U \ FIN \ V \ FIN \ U \ V \ FIN" +proof - + have "{0\<^sup>\} \ FIN" + using singleton_in_FIN const_in_Prim1 by simp + moreover have "U_single \ FIN" + using U_single_in_FIN by simp + ultimately show ?thesis + using zero_U_single_not_in_FIN by blast +qed + +text \In contrast to the inference types, NUM is closed under the union +of classes. The total numberings that exist for each NUM class can be +interleaved to produce a total numbering encompassing the union of the +classes. To define the interleaving, modulo and division by two will be +helpful.\ + +definition "r_div2 \ + r_shrink + (Pr 1 Z + (Cn 3 r_ifle + [Cn 3 r_mul [r_constn 2 2, Cn 3 S [Id 3 0]], Id 3 2, Cn 3 S [Id 3 1], Id 3 1]))" + +lemma r_div2_prim [simp]: "prim_recfn 1 r_div2" + unfolding r_div2_def by simp + +lemma r_div2 [simp]: "eval r_div2 [n] \= n div 2" +proof - + let ?p = "Pr 1 Z + (Cn 3 r_ifle + [Cn 3 r_mul [r_constn 2 2, Cn 3 S [Id 3 0]], Id 3 2, Cn 3 S [Id 3 1], Id 3 1])" + have "eval ?p [i, n] \= min (n div 2) i" for i + by (induction i) auto + then have "eval ?p [n, n] \= n div 2" by simp + then show ?thesis unfolding r_div2_def by simp +qed + +definition "r_mod2 \ Cn 1 r_sub [Id 1 0, Cn 1 r_mul [r_const 2, r_div2]]" + +lemma r_mod2_prim [simp]: "prim_recfn 1 r_mod2" + unfolding r_mod2_def by simp + +lemma r_mod2 [simp]: "eval r_mod2 [n] \= n mod 2" + unfolding r_mod2_def using Rings.semiring_modulo_class.minus_mult_div_eq_mod + by auto + +lemma NUM_closed_under_union: + assumes "U \ NUM" and "V \ NUM" + shows "U \ V \ NUM" +proof - + from assms obtain psi_u psi_v where + psi_u: "psi_u \ \\<^sup>2" "\f. f \ U \ \i. psi_u i = f" and + psi_v: "psi_v \ \\<^sup>2" "\f. f \ V \ \i. psi_v i = f" + by fastforce + define psi where "psi \ \i. if i mod 2 = 0 then psi_u (i div 2) else psi_v (i div 2)" + from psi_u(1) obtain u where u: "recfn 2 u" "total u" "\x y. eval u [x, y] = psi_u x y" + by auto + from psi_v(1) obtain v where v: "recfn 2 v" "total v" "\x y. 
eval v [x, y] = psi_v x y" + by auto + let ?r_psi = "Cn 2 r_ifz + [Cn 2 r_mod2 [Id 2 0], + Cn 2 u [Cn 2 r_div2 [Id 2 0], Id 2 1], + Cn 2 v [Cn 2 r_div2 [Id 2 0], Id 2 1]]" + show ?thesis + proof (rule NUM_I[of psi]) + show "psi \ \\<^sup>2" + proof (rule R2I) + show "recfn 2 ?r_psi" + using u(1) v(1) by simp + show "eval ?r_psi [x, y] = psi x y" for x y + using u v psi_def prim_recfn_total R2_imp_total2[OF psi_u(1)] + R2_imp_total2[OF psi_v(1)] + by simp + moreover have "psi x y \" for x y + using psi_def psi_u(1) psi_v(1) by simp + ultimately show "total ?r_psi" + using `recfn 2 ?r_psi` totalI2 by simp + qed + show "\i. psi i = f" if "f \ U \ V" for f + proof (cases "f \ U") + case True + then obtain j where "psi_u j = f" + using psi_u(2) by auto + then have "psi (2 * j) = f" + using psi_def by simp + then show ?thesis by auto + next + case False + then have "f \ V" + using that by simp + then obtain j where "psi_v j = f" + using psi_v(2) by auto + then have "psi (Suc (2 * j)) = f" + using psi_def by simp + then show ?thesis by auto + qed + qed +qed + +end \ No newline at end of file diff --git a/thys/Inductive_Inference/Universal.thy b/thys/Inductive_Inference/Universal.thy new file mode 100644 --- /dev/null +++ b/thys/Inductive_Inference/Universal.thy @@ -0,0 +1,2537 @@ +section \A universal partial recursive function\ + +theory Universal + imports Partial_Recursive +begin + +text \The main product of this section is a universal partial recursive +function, which given a code $i$ of an $n$-ary partial recursive function $f$ +and an encoded list @{term xs} of $n$ arguments, computes @{term "eval f +xs"}. From this we can derive fixed-arity universal functions satisfying the +usual results such as the $s$-$m$-$n$ theorem. To represent the code $i$, we +need a way to encode @{typ recf}s as natural numbers (Section~\ref{s:recf_enc}). To +construct the universal function, we devise a ternary function taking $i$, +$xs$, and a step bound $t$ and simulating the execution of $f$ on input $xs$ for +$t$ steps. This function is useful in its own right, enabling techniques like +dovetailing or ``concurrent'' evaluation of partial recursive functions. + +The notion of a ``step'' is not part of the definition of (the evaluation of) +partial recursive functions, but one can simulate the evaluation on an +abstract machine (Section~\ref{s:step}). This machine's configurations can be +encoded as natural numbers, and this leads us to a step function @{typ "nat +\ nat"} on encoded configurations (Section~\ref{s:step_enc}). +This function in turn can be computed by a primitive recursive function, from +which we develop the aforementioned ternary function of $i$, @{term xs}, and +$t$ (Section~\ref{s:step_recf}). From this we can finally derive +a universal function (Section~\ref{s:the_universal}).\ + +subsection \A step function\label{s:step}\ + +text \We simulate the stepwise execution of a partial recursive +function in a fairly straightforward way reminiscent of the execution of +function calls in an imperative programming language. A configuration of the +abstract machine is a pair consisting of: +\begin{enumerate} +\item A stack of frames. A frame represents the execution of a function and is + a triple @{term "(f, xs, locals)"} of + \begin{enumerate} + \item a @{typ recf} @{term f} being executed, + \item a @{typ "nat list"} of arguments of @{term f}, + \item a @{typ "nat list"} of local variables, which holds intermediate + values when @{term f} is of the form @{term Cn}, @{term Pr}, or @{term Mn}. 
+ \end{enumerate} +\item A register of type @{typ "nat option"} representing the return value of + the last function call: @{term None} signals that in the previous step the + stack was not popped and hence no value was returned, whereas @{term "Some + v"} means that in the previous step a function returned @{term v}. +\end{enumerate} +For computing @{term h} on input @{term xs}, the initial configuration is +@{term "([(h, xs, [])], None)"}. When the computation for a frame ends, it is +popped off the stack, and its return value is put in the register. The entire +computation ends when the stack is empty. In such a final configuration the +register contains the value of @{term h} at @{term xs}. If no final +configuration is ever reached, @{term h} diverges at @{term xs}. + +The execution of one step depends on the topmost (that is, active) frame. In +the step when a frame @{term "(h, xs, locals)"} is pushed onto the stack, the +local variables are @{term "locals = []"}. The following happens until the +frame is popped off the stack again (if it ever is): +\begin{itemize} +\item For the base functions @{term "h = Z"}, @{term "h = S"}, + @{term[names_short] "h = Id m n"}, the frame is popped off the stack right away, + and the return value is placed in the register. +\item For @{term "h = Cn n f gs"}, for each function $g$ in @{term gs}: + \begin{enumerate} + \item A new frame of the form @{term "(g, xs, [])"} is pushed onto the stack. + \item When (and if) this frame + is eventually popped, the value in the register is @{term "eval g xs"}. This value + is appended to the list @{term locals} of local variables. + \end{enumerate} + When all $g$ in $gs$ have been evaluated in this manner, $f$ is evaluated on the local variables + by pushing @{term "(f, locals, [])"}. The resulting register value is kept + and the active frame for $h$ is popped off the stack. +\item For @{text "h = Pr n f g"}, let @{term "xs = y # ys"}. First @{term "(f, + ys, [])"} is pushed and the return value stored in the @{term + locals}. Then @{term "(g, x # v # ys, [])"} is pushed, + where $x$ is the length of @{term locals} and $v$ the most recently + appended value. The return value is appended to @{term locals}. This is + repeated until the length of @{term locals} reaches @{term y}. Then the most + recently appended local is placed in the register, and the stack is popped. +\item For @{text "h = Mn n f"}, frames @{term "(f, x # xs, [])"} are pushed + for $x = 0, 1, 2, \ldots$ until one of them returns $0$. Then this + $x$ is placed in the register and the stack is popped. Until then $x$ is + stored in @{term locals}. If none of these evaluations return $0$, the + stack never shrinks, and thus the machine never reaches a final state. +\end{itemize}\ + +type_synonym frame = "recf \ nat list \ nat list" + +type_synonym configuration = "frame list \ nat option" + + +subsubsection \Definition of the step function\ + +fun step :: "configuration \ configuration" where + "step ([], rv) = ([], rv)" +| "step (((Z, _, _) # fs), rv) = (fs, Some 0)" +| "step (((S, xs, _) # fs), rv) = (fs, Some (Suc (hd xs)))" +| "step (((Id m n, xs, _) # fs), rv) = (fs, Some (xs ! n))" +| "step (((Cn n f gs, xs, ls) # fs), rv) = + (if length ls = length gs + then if rv = None + then ((f, ls, []) # (Cn n f gs, xs, ls) # fs, None) + else (fs, rv) + else if rv = None + then if length ls < length gs + then ((gs ! 
(length ls), xs, []) # (Cn n f gs, xs, ls) # fs, None) + else (fs, rv) \\cannot occur, so don't-care term\ + else ((Cn n f gs, xs, ls @ [the rv]) # fs, None))" +| "step (((Pr n f g, xs, ls) # fs), rv) = + (if ls = [] + then if rv = None + then ((f, tl xs, []) # (Pr n f g, xs, ls) # fs, None) + else ((Pr n f g, xs, [the rv]) # fs, None) + else if length ls = Suc (hd xs) + then (fs, Some (hd ls)) + else if rv = None + then ((g, (length ls - 1) # hd ls # tl xs, []) # (Pr n f g, xs, ls) # fs, None) + else ((Pr n f g, xs, (the rv) # ls) # fs, None))" +| "step (((Mn n f, xs, ls) # fs), rv) = + (if ls = [] + then ((f, 0 # xs, []) # (Mn n f, xs, [0]) # fs, None) + else if rv = Some 0 + then (fs, Some (hd ls)) + else ((f, (Suc (hd ls)) # xs, []) # (Mn n f, xs, [Suc (hd ls)]) # fs, None))" + +definition reachable :: "configuration \ configuration \ bool" where + "reachable x y \ \t. iterate t step x = y" + +lemma step_reachable [intro]: + assumes "step x = y" + shows "reachable x y" + unfolding reachable_def using assms by (metis iterate.simps(1,2) comp_id) + +lemma reachable_transitive [trans]: + assumes "reachable x y" and "reachable y z" + shows "reachable x z" + using assms iterate_additive[where ?f=step] reachable_def by metis + +lemma reachable_refl: "reachable x x" + unfolding reachable_def by (metis iterate.simps(1) eq_id_iff) + +text \From a final configuration, that is, when the stack is empty, +only final configurations are reachable.\ + +lemma step_empty_stack: + assumes "fst x = []" + shows "fst (step x) = []" + using assms by (metis prod.collapse step.simps(1)) + +lemma reachable_empty_stack: + assumes "fst x = []" and "reachable x y" + shows "fst y = []" +proof - + have "fst (iterate t step x) = []" for t + using assms step_empty_stack by (induction t) simp_all + then show ?thesis + using reachable_def assms(2) by auto +qed + +abbreviation nonterminating :: "configuration \ bool" where + "nonterminating x \ \t. fst (iterate t step x) \ []" + +lemma reachable_nonterminating: + assumes "reachable x y" and "nonterminating y" + shows "nonterminating x" +proof - + from assms(1) obtain t\<^sub>1 where t1: "iterate t\<^sub>1 step x = y" + using reachable_def by auto + have "fst (iterate t step x) \ []" for t + proof (cases "t \ t\<^sub>1") + case True + then show ?thesis + using t1 assms(2) reachable_def reachable_empty_stack iterate_additive' + by (metis le_Suc_ex) + next + case False + then have "iterate t step x = iterate (t\<^sub>1 + (t - t\<^sub>1)) step x" + by simp + then have "iterate t step x = iterate (t - t\<^sub>1) step (iterate t\<^sub>1 step x)" + by (simp add: iterate_additive') + then have "iterate t step x = iterate (t - t\<^sub>1) step y" + using t1 by simp + then show "fst (iterate t step x) \ []" + using assms(2) by simp + qed + then show ?thesis .. +qed + +text \The function @{term step} is underdefined, for example, when the +top frame contains a non-well-formed @{typ recf} or too few arguments. All is +well, though, if every frame contains a well-formed @{typ recf} whose arity +matches the number of arguments. Such stacks will be called +\emph{valid}.\ + +definition valid :: "frame list \ bool" where + "valid stack \ \s\set stack. 
recfn (length (fst (snd s))) (fst s)" + +lemma valid_frame: "valid (s # ss) \ valid ss \ recfn (length (fst (snd s))) (fst s)" + using valid_def by simp + +lemma valid_ConsE: "valid ((f, xs, locs) # rest) \ valid rest \ recfn (length xs) f" + using valid_def by simp + +lemma valid_ConsI: "valid rest \ recfn (length xs) f \ valid ((f, xs, locs) # rest)" + using valid_def by simp + +text \Stacks in initial configurations are valid, and performing a step +maintains the validity of the stack.\ + +lemma step_valid: "valid stack \ valid (fst (step (stack, rv)))" +proof (cases stack) + case Nil + then show ?thesis using valid_def by simp +next + case (Cons s ss) + assume valid: "valid stack" + then have *: "valid ss \ recfn (length (fst (snd s))) (fst s)" + using valid_frame Cons by simp + show ?thesis + proof (cases "fst s") + case Z + then show ?thesis using Cons valid * by (metis fstI prod.collapse step.simps(2)) + next + case S + then show ?thesis using Cons valid * by (metis fst_conv prod.collapse step.simps(3)) + next + case Id + then show ?thesis using Cons valid * by (metis fstI prod.collapse step.simps(4)) + next + case (Cn n f gs) + then obtain xs ls where "s = (Cn n f gs, xs, ls)" + using Cons by (metis prod.collapse) + moreover consider + "length ls = length gs \ rv \" + | "length ls = length gs \ rv \" + | "length ls < length gs \ rv \" + | "length ls \ length gs \ rv \" + | "length ls > length gs \ rv \" + by linarith + ultimately show ?thesis using valid Cons valid_def by (cases) auto + next + case (Pr n f g) + then obtain xs ls where s: "s = (Pr n f g, xs, ls)" + using Cons by (metis prod.collapse) + consider + "length ls = 0 \ rv \" + | "length ls = 0 \ rv \" + | "length ls \ 0 \ length ls = Suc (hd xs)" + | "length ls \ 0 \ length ls \ Suc (hd xs) \ rv \" + | "length ls \ 0 \ length ls \ Suc (hd xs) \ rv \" + by linarith + then show ?thesis using Cons * valid_def s by (cases) auto + next + case (Mn n f) + then obtain xs ls where s: "s = (Mn n f, xs, ls)" + using Cons by (metis prod.collapse) + consider + "length ls = 0" + | "length ls \ 0 \ rv \" + | "length ls \ 0 \ rv \" + by linarith + then show ?thesis using Cons * valid_def s by (cases) auto + qed +qed + +corollary iterate_step_valid: + assumes "valid stack" + shows "valid (fst (iterate t step (stack, rv)))" + using assms +proof (induction t) + case 0 + then show ?case by simp +next + case (Suc t) + moreover have "iterate (Suc t) step (stack, rv) = step (iterate t step (stack, rv))" + by simp + ultimately show ?case using step_valid valid_def by (metis prod.collapse) +qed + + +subsubsection \Correctness of the step function\ + +text \The function @{term step} works correctly for a @{typ recf} $f$ +on arguments @{term xs} in some configuration if (1) in case $f$ converges, @{term +step} reaches a configuration with the topmost frame popped and @{term "eval +f xs"} in the register, and (2) in case $f$ diverges, @{term step} does not +reach a final configuration.\ + +fun correct :: "configuration \ bool" where + "correct ([], r) = True" +| "correct ((f, xs, ls) # rest, r) = + (if eval f xs \ then reachable ((f, xs, ls) # rest, r) (rest, eval f xs) + else nonterminating ((f, xs, ls) # rest, None))" + +lemma correct_convergI: + assumes "eval f xs \" and "reachable ((f, xs, ls) # rest, None) (rest, eval f xs)" + shows "correct ((f, xs, ls) # rest, None)" + using assms by auto + +lemma correct_convergE: + assumes "correct ((f, xs, ls) # rest, None)" and "eval f xs \" + shows "reachable ((f, xs, ls) # rest, None) (rest, eval f xs)" 
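+  (* Elimination form of correctness for a convergent top frame; the
+     correctness proofs below use it to chain reachability through the
+     sub-computations of Cn, Pr, and Mn. *)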
+ using assms by simp + +text \The correctness proof for @{term step} is by structural induction +on the @{typ recf} in the top frame. The base cases @{term Z}, @{term S}, +and @{term[names_short] Id} are simple. For @{text "X = Cn, Pr, Mn"}, the +lemmas named @{text reachable_X} show which configurations are reachable for +@{typ recf}s of shape @{text X}. Building on those, the lemmas named @{text +step_X_correct} show @{term step}'s correctness for @{text X}.\ + +lemma reachable_Cn: + assumes "valid (((Cn n f gs), xs, []) # rest)" (is "valid ?stack") + and "\xs rest. valid ((f, xs, []) # rest) \ correct ((f, xs, []) # rest, None)" + and "\g xs rest. + g \ set gs \ valid ((g, xs, []) # rest) \ correct ((g, xs, []) # rest, None)" + and "\i" + and "k \ length gs" + shows "reachable + (?stack, None) + ((Cn n f gs, xs, take k (map (\g. the (eval g xs)) gs)) # rest, None)" + using assms(4,5) +proof (induction k) + case 0 + then show ?case using reachable_refl by simp +next + case (Suc k) + let ?ys = "map (\g. the (eval g xs)) gs" + from Suc have "k < length gs" by simp + have valid: "recfn (length xs) (Cn n f gs)" "valid rest" + using assms(1) valid_ConsE[of "(Cn n f gs)"] by simp_all + from Suc have "reachable (?stack, None) ((Cn n f gs, xs, take k ?ys) # rest, None)" + (is "_ (?stack1, None)") + by simp + also have "reachable ... ((gs ! k, xs, []) # ?stack1, None)" + using step_reachable `k < length gs` by (simp add: min_absorb2) + also have "reachable ... (?stack1, eval (gs ! k) xs)" + (is "_ (_, ?rv)") + using Suc.prems(1) \k < length gs\ assms(3) valid valid_ConsI by auto + also have "reachable ... ((Cn n f gs, xs, (take (Suc k) ?ys)) # rest, None)" + (is "_ (?stack2, None)") + proof - + have "step (?stack1, ?rv) = ((Cn n f gs, xs, (take k ?ys) @ [the ?rv]) # rest, None)" + using Suc by auto + also have "... = ((Cn n f gs, xs, (take (Suc k) ?ys)) # rest, None)" + by (simp add: \k < length gs\ take_Suc_conv_app_nth) + finally show ?thesis + using step_reachable by simp + qed + finally show "reachable (?stack, None) (?stack2, None)" . +qed + +lemma step_Cn_correct: + assumes "valid (((Cn n f gs), xs, []) # rest)" (is "valid ?stack") + and "\xs rest. valid ((f, xs, []) # rest) \ correct ((f, xs, []) # rest, None)" + and "\g xs rest. + g \ set gs \ valid ((g, xs, []) # rest) \ correct ((g, xs, []) # rest, None)" + shows "correct (?stack, None)" +proof - + have valid: "recfn (length xs) (Cn n f gs)" "valid rest" + using valid_ConsE[OF assms(1)] by auto + let ?ys = "map (\g. the (eval g xs)) gs" + consider + (diverg_f) "\g\set gs. eval g xs \" and "eval f ?ys \" + | (diverg_gs) "\g\set gs. eval g xs \" + | (converg) "eval (Cn n f gs) xs \" + using valid_ConsE[OF assms(1)] by fastforce + then show ?thesis + proof (cases) + case diverg_f + then have "\i" by simp + then have "reachable (?stack, None) ((Cn n f gs, xs, ?ys) # rest, None)" + (is "_ (?stack1, None)") + using reachable_Cn[OF assms, where ?k="length gs"] by simp + also have "reachable ... ((f, ?ys, []) # ?stack1, None)" (is "_ (?stack2, None)") + by (simp add: step_reachable) + finally have "reachable (?stack, None) (?stack2, None)" . 
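+    (* ?stack2 has f on top of the stack, applied to the list of values of
+       the functions gs; since eval f diverges on these arguments (diverg_f),
+       no final configuration is reachable from ?stack2. *)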
+ moreover have "nonterminating (?stack2, None)" + using diverg_f(2) assms(2)[of ?ys ?stack1] valid_ConsE[OF assms(1)] valid_ConsI + by auto + ultimately have "nonterminating (?stack, None)" + using reachable_nonterminating by simp + moreover have "eval (Cn n f gs) xs \" + using diverg_f(2) assms(1) eval_Cn valid_ConsE by presburger + ultimately show ?thesis by simp + next + case diverg_gs + then have ex_i: "\i" + using in_set_conv_nth[of _ gs] by auto + define k where "k = (LEAST i. i < length gs \ eval (gs ! i) xs \)" (is "_ = Least ?P") + then have gs_k: "eval (gs ! k) xs \" + using LeastI_ex[OF ex_i] by simp + have "\i" + using k_def not_less_Least[of _ ?P] LeastI_ex[OF ex_i] by simp + moreover from this have "k < length gs" + using ex_i less_le_trans not_le by blast + ultimately have "reachable (?stack, None) ((Cn n f gs, xs, take k ?ys) # rest, None)" + using reachable_Cn[OF assms] by simp + also have "reachable ... + ((gs ! (length (take k ?ys)), xs, []) # (Cn n f gs, xs, take k ?ys) # rest, None)" + (is "_ (?stack1, None)") + proof - + have "length (take k ?ys) < length gs" + by (simp add: \k < length gs\ less_imp_le_nat min_less_iff_disj) + then show ?thesis using step_reachable by simp + qed + finally have "reachable (?stack, None) (?stack1, None)" . + moreover have "nonterminating (?stack1, None)" + proof - + have "recfn (length xs) (gs ! k)" + using \k < length gs\ valid(1) by simp + then have "correct (?stack1, None)" + using \k < length gs\ nth_mem valid valid_ConsI + assms(3)[of "gs ! (length (take k ?ys))" xs] + by auto + moreover have "length (take k ?ys) = k" + by (simp add: \k < length gs\ less_imp_le_nat min_absorb2) + ultimately show ?thesis using gs_k by simp + qed + ultimately have "nonterminating (?stack, None)" + using reachable_nonterminating by simp + moreover have "eval (Cn n f gs) xs \" + using diverg_gs valid by fastforce + ultimately show ?thesis by simp + next + case converg + then have f: "eval f ?ys \" and g: "\g. g \ set gs \ eval g xs \" + using valid(1) by (metis eval_Cn)+ + then have "\i" + by simp + then have "reachable (?stack, None) ((Cn n f gs, xs, take (length gs) ?ys) # rest, None)" + using reachable_Cn assms by blast + also have "reachable ... ((Cn n f gs, xs, ?ys) # rest, None)" (is "_ (?stack1, None)") + by (simp add: reachable_refl) + also have "reachable ... ((f, ?ys, []) # ?stack1, None)" + using step_reachable by simp + also have "reachable ... (?stack1, eval f ?ys)" + using assms(2)[of "?ys"] correct_convergE valid f valid_ConsI by auto + also have "reachable (?stack1, eval f ?ys) (rest, eval f ?ys)" + using f by auto + finally have "reachable (?stack, None) (rest, eval f ?ys)" . + moreover have "eval (Cn n f gs) xs = eval f ?ys" + using g valid(1) by auto + ultimately show ?thesis + using converg correct_convergI by auto + qed +qed + +text \During the execution of a frame with a partial recursive function +of shape @{term "Pr n f g"} and arguments @{term "x # xs"}, the list of local +variables collects all the function values up to @{term x} in reversed +order. We call such a list a @{term trace} for short.\ + +definition trace :: "nat \ recf \ recf \ nat list \ nat \ nat list" where + "trace n f g xs x \ map (\y. the (eval (Pr n f g) (y # xs))) (rev [0..xs rest. valid ((f, xs, []) # rest) \ correct ((f, xs, []) # rest, None)" + and "\xs rest. 
valid ((g, xs, []) # rest) \ correct ((g, xs, []) # rest, None)" + and "y \ x" + and "eval (Pr n f g) (y # xs) \" + shows "reachable (?stack, None) ((Pr n f g, x # xs, trace n f g xs y) # rest, None)" + using assms(4,5) +proof (induction y) + case 0 + have valid: "recfn (length (x # xs)) (Pr n f g)" "valid rest" + using valid_ConsE[OF assms(1)] by simp_all + then have f: "eval f xs \" using 0 by simp + let ?as = "x # xs" + have "reachable (?stack, None) ((f, xs, []) # ((Pr n f g), ?as, []) # rest, None)" + using step_reachable by simp + also have "reachable ... (?stack, eval f xs)" + using assms(2)[of xs "((Pr n f g), ?as, []) # rest"] + correct_convergE[OF _ f] f valid valid_ConsI + by simp + also have "reachable ... ((Pr n f g, ?as, [the (eval f xs)]) # rest, None)" + using step_reachable valid(1) f by simp + finally have "reachable (?stack, None) ((Pr n f g, ?as, [the (eval f xs)]) # rest, None)" . + then show ?case using trace_def valid(1) by simp +next + case (Suc y) + have valid: "recfn (length (x # xs)) (Pr n f g)" "valid rest" + using valid_ConsE[OF assms(1)] by simp_all + let ?ls = "trace n f g xs y" + have lenls: "length ?ls = Suc y" + using trace_length by auto + moreover have hdls: "hd ?ls = the (eval (Pr n f g) (y # xs))" + using Suc trace_hd by auto + ultimately have g: + "eval g (y # hd ?ls # xs) \" + "eval (Pr n f g) (Suc y # xs) = eval g (y # hd ?ls # xs)" + using eval_Pr_Suc_converg hdls valid(1) Suc by simp_all + then have "reachable (?stack, None) ((Pr n f g, x # xs, ?ls) # rest, None)" + (is "_ (?stack1, None)") + using Suc valid(1) by fastforce + also have "reachable ... ((g, y # hd ?ls # xs, []) # (Pr n f g, x # xs, ?ls) # rest, None)" + using Suc.prems lenls by fastforce + also have "reachable ... (?stack1, eval g (y # hd ?ls # xs))" + (is "_ (_, ?rv)") + using assms(3) g(1) valid valid_ConsI by auto + also have "reachable ... ((Pr n f g, x # xs, (the ?rv) # ?ls) # rest, None)" + using Suc.prems(1) g(1) lenls by auto + finally have "reachable (?stack, None) ((Pr n f g, x # xs, (the ?rv) # ?ls) # rest, None)" . + moreover have "trace n f g xs (Suc y) = (the ?rv) # ?ls" + using g(2) trace_Suc by simp + ultimately show ?case by simp +qed + +lemma step_Pr_correct: + assumes "valid (((Pr n f g), xs, []) # rest)" (is "valid ?stack") + and "\xs rest. valid ((f, xs, []) # rest) \ correct ((f, xs, []) # rest, None)" + and "\xs rest. valid ((g, xs, []) # rest) \ correct ((g, xs, []) # rest, None)" + shows "correct (?stack, None)" +proof - + have valid: "valid rest" "recfn (length xs) (Pr n f g)" + using valid_ConsE[OF assms(1)] by simp_all + then have "length xs > 0" + by auto + then obtain y ys where y_ys: "xs = y # ys" + using list.exhaust_sel by auto + let ?t = "trace n f g ys" + consider + (converg) "eval (Pr n f g) xs \" + | (diverg_f) "eval (Pr n f g) xs \" and "eval f ys \" + | (diverg) "eval (Pr n f g) xs \" and "eval f ys \" + by auto + then show ?thesis + proof (cases) + case converg + then have "\z. 
z \ y \ reachable (?stack, None) (((Pr n f g), xs, ?t z) # rest, None)" + using assms valid by (simp add: eval_Pr_converg_le reachable_Pr y_ys) + then have "reachable (?stack, None) (((Pr n f g), xs, ?t y) # rest, None)" + by simp + moreover have "reachable (((Pr n f g), xs, ?t y) # rest, None) (rest, Some (hd (?t y)))" + using trace_length step_reachable y_ys by fastforce + ultimately have "reachable (?stack, None) (rest, Some (hd (?t y)))" + using reachable_transitive by blast + then show ?thesis + using assms(1) trace_hd converg y_ys by simp + next + case diverg_f + have *: "step (?stack, None) = ((f, ys, []) # ((Pr n f g), xs, []) # tl ?stack, None)" + (is "_ = (?stack1, None)") + using assms(1,2) y_ys by simp + then have "reachable (?stack, None) (?stack1, None)" + using step_reachable by simp + moreover have "nonterminating (?stack1, None)" + using assms diverg_f valid valid_ConsI * by auto + ultimately have "nonterminating (?stack, None)" + using reachable_nonterminating by blast + then show ?thesis using diverg_f(1) assms(1) by simp + next + case diverg + let ?h = "\z. the (eval (Pr n f g) (z # ys))" + let ?Q = "\z. z < y \ eval (Pr n f g) (z # ys) \" + have "?Q 0" + using assms diverg neq0_conv y_ys valid by fastforce + define zmax where "zmax = Greatest ?Q" + then have "?Q zmax" + using `?Q 0` GreatestI_nat[of ?Q 0 y] by simp + have le_zmax: "\z. ?Q z \ z \ zmax" + using Greatest_le_nat[of ?Q _ y] zmax_def by simp + have len: "length (?t zmax) < Suc y" + by (simp add: \?Q zmax\ trace_length) + have "eval (Pr n f g) (y # ys) \" if "y \ zmax" for y + using that zmax_def `?Q zmax` assms eval_Pr_converg_le[of n f g ys zmax y] valid y_ys + by simp + then have "reachable (?stack, None) (((Pr n f g), xs, ?t y) # rest, None)" + if "y \ zmax" for y + using that `?Q zmax` diverg y_ys assms reachable_Pr by simp + then have "reachable (?stack, None) (((Pr n f g), xs, ?t zmax) # rest, None)" + (is "reachable _ (?stack1, None)") + by simp + also have "reachable ... + ((g, zmax # ?h zmax # tl xs, []) # (Pr n f g, xs, ?t zmax) # rest, None)" + (is "_ (?stack2, None)") + proof (rule step_reachable) + have "length (?t zmax) \ Suc (hd xs)" + using len y_ys by simp + moreover have "hd (?t zmax) = ?h zmax" + using trace_hd by auto + moreover have "length (?t zmax) = Suc zmax" + using trace_length by simp + ultimately show "step (?stack1, None) = (?stack2, None)" + by auto + qed + finally have "reachable (?stack, None) (?stack2, None)" . + moreover have "nonterminating (?stack2, None)" + proof - + have "correct (?stack2, None)" + using y_ys assms valid_ConsI valid by simp + moreover have "eval g (zmax # ?h zmax # ys) \" + using \?Q zmax\ diverg le_zmax len less_Suc_eq trace_length y_ys valid + by fastforce + ultimately show ?thesis using y_ys by simp + qed + ultimately have "nonterminating (?stack, None)" + using reachable_nonterminating by simp + then show ?thesis using diverg assms(1) by simp + qed +qed + +lemma reachable_Mn: + assumes "valid ((Mn n f, xs, []) # rest)" (is "valid ?stack") + and "\xs rest. 
valid ((f, xs, []) # rest) \ correct ((f, xs, []) # rest, None)" + and "\y {None, Some 0}" + shows "reachable (?stack, None) ((f, z # xs, []) # (Mn n f, xs, [z]) # rest, None)" + using assms(3) +proof (induction z) + case 0 + then have "step (?stack, None) = ((f, 0 # xs, []) # (Mn n f, xs, [0]) # rest, None)" + using assms by simp + then show ?case + using step_reachable assms(1) by simp +next + case (Suc z) + have valid: "valid rest" "recfn (length xs) (Mn n f)" + using valid_ConsE[OF assms(1)] by auto + have f: "eval f (z # xs) \ {None, Some 0}" + using Suc by simp + have "reachable (?stack, None) ((f, z # xs, []) # (Mn n f, xs, [z]) # rest, None)" + using Suc by simp + also have "reachable ... ((Mn n f, xs, [z]) # rest, eval f (z # xs))" + using f assms(2)[of "z # xs"] valid correct_convergE valid_ConsI by auto + also have "reachable ... ((f, (Suc z) # xs, []) # (Mn n f, xs, [Suc z]) # rest, None)" + (is "_ (?stack1, None)") + using step_reachable f by simp + finally have "reachable (?stack, None) (?stack1, None)" . + then show ?case by simp +qed + +lemma iterate_step_empty_stack: "iterate t step ([], rv) = ([], rv)" + using step_empty_stack by (induction t) simp_all + +lemma reachable_iterate_step_empty_stack: + assumes "reachable cfg ([], rv)" + shows "\t. iterate t step cfg = ([], rv) \ (\t' [])" +proof - + let ?P = "\t. iterate t step cfg = ([], rv)" + from assms have "\t. ?P t" + by (simp add: reachable_def) + moreover define tmin where "tmin = Least ?P" + ultimately have "?P tmin" + using LeastI_ex[of ?P] by simp + have "fst (iterate t' step cfg) \ []" if "t' < tmin" for t' + proof + assume "fst (iterate t' step cfg) = []" + then obtain v where v: "iterate t' step cfg = ([], v)" + by (metis prod.exhaust_sel) + then have "iterate t'' step ([], v) = ([], v)" for t'' + using iterate_step_empty_stack by simp + then have "iterate (t' + t'') step cfg = ([], v)" for t'' + using v iterate_additive by fast + moreover obtain t'' where "t' + t'' = tmin" + using \t' < tmin\ less_imp_add_positive by auto + ultimately have "iterate tmin step cfg = ([], v)" + by auto + then have "v = rv" + using `?P tmin` by simp + then have "iterate t' step cfg = ([], rv)" + using v by simp + moreover have "\t' ?P t'" + unfolding tmin_def using not_less_Least[of _ ?P] by simp + ultimately show False + using that by simp + qed + then show ?thesis using `?P tmin` by auto +qed + +lemma step_Mn_correct: + assumes "valid ((Mn n f, xs, []) # rest)" (is "valid ?stack") + and "\xs rest. valid ((f, xs, []) # rest) \ correct ((f, xs, []) # rest, None)" + shows "correct (?stack, None)" +proof - + have valid: "valid rest" "recfn (length xs) (Mn n f)" + using valid_ConsE[OF assms(1)] by auto + consider + (diverg) "eval (Mn n f) xs \" and "\z. eval f (z # xs) \" + | (diverg_f) "eval (Mn n f) xs \" and "\z. eval f (z # xs) \" + | (converg) "eval (Mn n f) xs \" + by fast + then show ?thesis + proof (cases) + case diverg + then have "\z. eval f (z # xs) \ Some 0" + using eval_Mn_diverg[OF valid(2)] by simp + then have "\y {None, Some 0}" for z + using diverg by simp + then have reach_z: + "\z. reachable (?stack, None) ((f, z # xs, []) # (Mn n f, xs, [z]) # rest, None)" + using reachable_Mn[OF assms] diverg by simp + + define h :: "nat \ configuration" where + "h z \ ((f, z # xs, []) # (Mn n f, xs, [z]) # rest, None)" for z + then have h_inj: "\x y. x \ y \ h x \ h y" and z_neq_Nil: "\z. fst (h z) \ []" + by simp_all + + have z: "\z\<^sub>0. \z>z\<^sub>0. \ (\t'\t. 
iterate t' step (?stack, None) = h z)" for t + proof (induction t) + case 0 + then show ?case by (metis h_inj le_zero_eq less_not_refl3) + next + case (Suc t) + then show ?case + using h_inj by (metis (no_types, hide_lams) le_Suc_eq less_not_refl3 less_trans) + qed + + have "nonterminating (?stack, None)" + proof (rule ccontr) + assume "\ nonterminating (?stack, None)" + then obtain t where t: "fst (iterate t step (?stack, None)) = []" + by auto + then obtain z\<^sub>0 where "\z>z\<^sub>0. \ (\t'\t. iterate t' step (?stack, None) = h z)" + using z by auto + then have not_h: "\t'\t. iterate t' step (?stack, None) \ h (Suc z\<^sub>0)" + by simp + have "\t'\t. fst (iterate t' step (?stack, None)) = []" + using t iterate_step_empty_stack iterate_additive'[of t] + by (metis le_Suc_ex prod.exhaust_sel) + then have "\t'\t. iterate t' step (?stack, None) \ h (Suc z\<^sub>0)" + using z_neq_Nil by auto + then have "\t'. iterate t' step (?stack, None) \ h (Suc z\<^sub>0)" + using not_h nat_le_linear by auto + then have "\ reachable (?stack, None) (h (Suc z\<^sub>0))" + using reachable_def by simp + then show False + using reach_z[of "Suc z\<^sub>0"] h_def by simp + qed + then show ?thesis using diverg by simp + next + case diverg_f + let ?P = "\z. eval f (z # xs) \" + define zmin where "zmin \ Least ?P" + then have "\y {None, Some 0}" + using diverg_f eval_Mn_diverg[OF valid(2)] less_trans not_less_Least[of _ ?P] + by blast + moreover have f_zmin: "eval f (zmin # xs) \" + using diverg_f LeastI_ex[of ?P] zmin_def by simp + ultimately have + "reachable (?stack, None) ((f, zmin # xs, []) # (Mn n f, xs, [zmin]) # rest, None)" + (is "reachable _ (?stack1, None)") + using reachable_Mn[OF assms] by simp + moreover have "nonterminating (?stack1, None)" + using f_zmin assms valid diverg_f valid_ConsI by auto + ultimately have "nonterminating (?stack, None)" + using reachable_nonterminating by simp + then show ?thesis using diverg_f by simp + next + case converg + then obtain z where z: "eval (Mn n f) xs \= z" by auto + have f_z: "eval f (z # xs) \= 0" + and f_less_z: "\y. y < z \ eval f (y # xs) \\ 0" + using eval_Mn_convergE(2,3)[OF valid(2) z] by simp_all + then have + "reachable (?stack, None) ((f, z # xs, []) # (Mn n f, xs, [z]) # rest, None)" + using reachable_Mn[OF assms] by simp + also have "reachable ... ((Mn n f, xs, [z]) # rest, eval f (z # xs))" + using assms(2)[of "z # xs"] valid f_z valid_ConsI correct_convergE + by auto + also have "reachable ... (rest, Some z)" + using f_z f_less_z step_reachable by simp + finally have "reachable (?stack, None) (rest, Some z)" . 
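+    (* The Mn frame has been popped with the least z satisfying
+       eval f (z # xs) = Some 0 in the register, which is exactly
+       eval (Mn n f) xs. *)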
+ then show ?thesis using z by simp + qed +qed + +theorem step_correct: + assumes "valid ((f, xs, []) # rest)" + shows "correct ((f, xs, []) # rest, None)" + using assms +proof (induction f arbitrary: xs rest) + case Z + then show ?case using valid_ConsE[of Z] step_reachable by simp +next + case S + then show ?case using valid_ConsE[of S] step_reachable by simp +next + case (Id m n) + then show ?case using valid_ConsE[of "Id m n"] by auto +next + case Cn + then show ?case using step_Cn_correct by presburger +next + case Pr + then show ?case using step_Pr_correct by simp +next + case Mn + then show ?case using step_Mn_correct by presburger +qed + + +subsection \Encoding partial recursive functions\label{s:recf_enc}\ + +text \In this section we define an injective, but not surjective, +mapping from @{typ recf}s to natural numbers.\ + +abbreviation triple_encode :: "nat \ nat \ nat \ nat" where + "triple_encode x y z \ prod_encode (x, prod_encode (y, z))" + +abbreviation quad_encode :: "nat \ nat \ nat \ nat \ nat" where + "quad_encode w x y z \ prod_encode (w, prod_encode (x, prod_encode (y, z)))" + +fun encode :: "recf \ nat" where + "encode Z = 0" +| "encode S = 1" +| "encode (Id m n) = triple_encode 2 m n" +| "encode (Cn n f gs) = quad_encode 3 n (encode f) (list_encode (map encode gs))" +| "encode (Pr n f g) = quad_encode 4 n (encode f) (encode g)" +| "encode (Mn n f) = triple_encode 5 n (encode f)" + +lemma prod_encode_gr1: "a > 1 \ prod_encode (a, x) > 1" + using le_prod_encode_1 less_le_trans by blast + +lemma encode_not_Z_or_S: "encode f = prod_encode (a, b) \ a > 1 \ f \ Z \ f \ S" + by (metis encode.simps(1) encode.simps(2) less_numeral_extra(4) not_one_less_zero + prod_encode_gr1) + +lemma encode_injective: "encode f = encode g \ f = g" +proof (induction g arbitrary: f) + case Z + have "\a x. a > 1 \ prod_encode (a, x) > 0" + using prod_encode_gr1 by (meson less_one less_trans) + then have "f \ Z \ encode f > 0" + by (cases f) auto + then have "encode f = 0 \ f = Z" by fastforce + then show ?case using Z by simp +next + case S + have "\a x. 
a > 1 \ prod_encode (a, x) \ Suc 0" + using prod_encode_gr1 by (metis One_nat_def less_numeral_extra(4)) + then have "encode f = 1 \ f = S" + by (cases f) auto + then show ?case using S by simp +next + case Id + then obtain z where *: "encode f = prod_encode (2, z)" by simp + show ?case + using Id by (cases f) (simp_all add: * encode_not_Z_or_S prod_encode_eq) +next + case Cn + then obtain z where *: "encode f = prod_encode (3, z)" by simp + show ?case + proof (cases f) + case Z + then show ?thesis using * encode_not_Z_or_S by simp + next + case S + then show ?thesis using * encode_not_Z_or_S by simp + next + case Id + then show ?thesis using * by (simp add: prod_encode_eq) + next + case Cn + then show ?thesis + using * Cn.IH Cn.prems list_decode_encode + by (smt encode.simps(4) fst_conv list.inj_map_strong prod_encode_eq snd_conv) + next + case Pr + then show ?thesis using * by (simp add: prod_encode_eq) + next + case Mn + then show ?thesis using * by (simp add: prod_encode_eq) + qed +next + case Pr + then obtain z where *: "encode f = prod_encode (4, z)" by simp + show ?case + using Pr by (cases f) (simp_all add: * encode_not_Z_or_S prod_encode_eq) +next + case Mn + then obtain z where *: "encode f = prod_encode (5, z)" by simp + show ?case + using Mn by (cases f) (simp_all add: * encode_not_Z_or_S prod_encode_eq) +qed + +definition encode_kind :: "nat \ nat" where + "encode_kind e \ if e = 0 then 0 else if e = 1 then 1 else pdec1 e" + +lemma encode_kind_0: "encode_kind (encode Z) = 0" + unfolding encode_kind_def by simp + +lemma encode_kind_1: "encode_kind (encode S) = 1" + unfolding encode_kind_def by simp + +lemma encode_kind_2: "encode_kind (encode (Id m n)) = 2" + unfolding encode_kind_def + by (metis encode.simps(1-3) encode_injective fst_conv prod_encode_inverse + recf.simps(16) recf.simps(8)) + +lemma encode_kind_3: "encode_kind (encode (Cn n f gs)) = 3" + unfolding encode_kind_def + by (metis encode.simps(1,2,4) encode_injective fst_conv prod_encode_inverse + recf.simps(10) recf.simps(18)) + +lemma encode_kind_4: "encode_kind (encode (Pr n f g)) = 4" + unfolding encode_kind_def + by (metis encode.simps(1,2,5) encode_injective fst_conv prod_encode_inverse + recf.simps(12) recf.simps(20)) + +lemma encode_kind_5: "encode_kind (encode (Mn n f)) = 5" + unfolding encode_kind_def + by (metis encode.simps(1,2,6) encode_injective fst_conv prod_encode_inverse + recf.simps(14) recf.simps(22)) + +lemmas encode_kind_n = + encode_kind_0 encode_kind_1 encode_kind_2 encode_kind_3 encode_kind_4 encode_kind_5 + +lemma encode_kind_Cn: + assumes "encode_kind (encode f) = 3" + shows "\n f' gs. f = Cn n f' gs" + using assms encode_kind_n by (cases f) auto + +lemma encode_kind_Pr: + assumes "encode_kind (encode f) = 4" + shows "\n f' g. f = Pr n f' g" + using assms encode_kind_n by (cases f) auto + +lemma encode_kind_Mn: + assumes "encode_kind (encode f) = 5" + shows "\n g. f = Mn n g" + using assms encode_kind_n by (cases f) auto + +lemma pdec2_encode_Id: "pdec2 (encode (Id m n)) = prod_encode (m, n)" + by simp + +lemma pdec2_encode_Pr: "pdec2 (encode (Pr n f g)) = triple_encode n (encode f) (encode g)" + by simp + + +subsection \The step function on encoded configurations\label{s:step_enc}\ + +text \In this section we construct a function @{text "estep :: nat +\ nat"} that is equivalent to the function @{text "step :: +configuration \ configuration"} except that it applies to encoded +configurations. 
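+For example, the final configuration @{term "([], Some v)"} will be encoded
+as @{term "prod_encode (0, Suc v)"}, the empty stack being encoded by $0$.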
We start by defining an encoding for configurations.\ + +definition encode_frame :: "frame \ nat" where + "encode_frame s \ + triple_encode (encode (fst s)) (list_encode (fst (snd s))) (list_encode (snd (snd s)))" + +lemma encode_frame: + "encode_frame (f, xs, ls) = triple_encode (encode f) (list_encode xs) (list_encode ls)" + unfolding encode_frame_def by simp + +abbreviation encode_option :: "nat option \ nat" where + "encode_option x \ if x = None then 0 else Suc (the x)" + +definition encode_config :: "configuration \ nat" where + "encode_config cfg \ + prod_encode (list_encode (map encode_frame (fst cfg)), encode_option (snd cfg))" + +lemma encode_config: + "encode_config (ss, rv) = prod_encode (list_encode (map encode_frame ss), encode_option rv)" + unfolding encode_config_def by simp + +text \Various projections from encoded configurations:\ + +definition e2stack where "e2stack e \ pdec1 e" +definition e2rv where "e2rv e \ pdec2 e" +definition e2tail where "e2tail e \ e_tl (e2stack e)" +definition e2frame where "e2frame e \ e_hd (e2stack e)" +definition e2i where "e2i e \ pdec1 (e2frame e)" +definition e2xs where "e2xs e \ pdec12 (e2frame e)" +definition e2ls where "e2ls e \ pdec22 (e2frame e)" +definition e2lenas where "e2lenas e \ e_length (e2xs e)" +definition e2lenls where "e2lenls e \ e_length (e2ls e)" + +lemma e2rv_rv [simp]: + "e2rv (encode_config (ss, rv)) = (if rv \ then 0 else Suc (the rv))" + unfolding e2rv_def using encode_config by simp + +lemma e2stack_stack [simp]: + "e2stack (encode_config (ss, rv)) = list_encode (map encode_frame ss)" + unfolding e2stack_def using encode_config by simp + +lemma e2tail_tail [simp]: + "e2tail (encode_config (s # ss, rv)) = list_encode (map encode_frame ss)" + unfolding e2tail_def using encode_config by fastforce + +lemma e2frame_frame [simp]: + "e2frame (encode_config (s # ss, rv)) = encode_frame s" + unfolding e2frame_def using encode_config by fastforce + +lemma e2i_f [simp]: + "e2i (encode_config ((f, xs, ls) # ss, rv)) = encode f" + unfolding e2i_def using encode_config e2frame_frame encode_frame by force + +lemma e2xs_xs [simp]: + "e2xs (encode_config ((f, xs, ls) # ss, rv)) = list_encode xs" + using e2xs_def e2frame_frame encode_frame by force + +lemma e2ls_ls [simp]: + "e2ls (encode_config ((f, xs, ls) # ss, rv)) = list_encode ls" + using e2ls_def e2frame_frame encode_frame by force + +lemma e2lenas_lenas [simp]: + "e2lenas (encode_config ((f, xs, ls) # ss, rv)) = length xs" + using e2lenas_def e2frame_frame encode_frame by simp + +lemma e2lenls_lenls [simp]: + "e2lenls (encode_config ((f, xs, ls) # ss, rv)) = length ls" + using e2lenls_def e2frame_frame encode_frame by simp + +lemma e2stack_0_iff_Nil: + assumes "e = encode_config (ss, rv)" + shows "e2stack e = 0 \ ss = []" + using assms + by (metis list_encode.simps(1) e2stack_stack list_encode_0 map_is_Nil_conv) + +lemma e2ls_0_iff_Nil [simp]: "list_decode (e2ls e) = [] \ e2ls e = 0" + by (metis list_decode.simps(1) list_encode_decode) + +text \We now define @{text eterm} piecemeal by considering the more +complicated cases @{text Cn}, @{text Pr}, and @{text Mn} separately.\ + +definition "estep_Cn e \ + if e2lenls e = e_length (pdec222 (e2i e)) + then if e2rv e = 0 + then prod_encode (e_cons (triple_encode (pdec122 (e2i e)) (e2ls e) 0) (e2stack e), 0) + else prod_encode (e2tail e, e2rv e) + else if e2rv e = 0 + then if e2lenls e < e_length (pdec222 (e2i e)) + then prod_encode + (e_cons + (triple_encode (e_nth (pdec222 (e2i e)) (e2lenls e)) (e2xs e) 0) + (e2stack e), + 0) + 
else prod_encode (e2tail e, e2rv e) + else prod_encode + (e_cons + (triple_encode (e2i e) (e2xs e) (e_snoc (e2ls e) (e2rv e - 1))) + (e2tail e), + 0)" + +lemma estep_Cn: + assumes "c = (((Cn n f gs, xs, ls) # fs), rv)" + shows "estep_Cn (encode_config c) = encode_config (step c)" + using encode_frame by (simp add: assms estep_Cn_def, simp add: encode_config assms) + +definition "estep_Pr e \ + if e2ls e = 0 + then if e2rv e = 0 + then prod_encode + (e_cons (triple_encode (pdec122 (e2i e)) (e_tl (e2xs e)) 0) (e2stack e), + 0) + else prod_encode + (e_cons (triple_encode (e2i e) (e2xs e) (singleton_encode (e2rv e - 1))) (e2tail e), + 0) + else if e2lenls e = Suc (e_hd (e2xs e)) + then prod_encode (e2tail e, Suc (e_hd (e2ls e))) + else if e2rv e = 0 + then prod_encode + (e_cons + (triple_encode + (pdec222 (e2i e)) + (e_cons (e2lenls e - 1) (e_cons (e_hd (e2ls e)) (e_tl (e2xs e)))) + 0) + (e2stack e), + 0) + else prod_encode + (e_cons + (triple_encode (e2i e) (e2xs e) (e_cons (e2rv e - 1) (e2ls e))) (e2tail e), + 0)" + +lemma estep_Pr1: + assumes "c = (((Pr n f g, xs, ls) # fs), rv)" + and "ls \ []" + and "length ls \ Suc (hd xs)" + and "rv \ None" + and "recfn (length xs) (Pr n f g)" + shows "estep_Pr (encode_config c) = encode_config (step c)" +proof - + let ?e = "encode_config c" + from assms(5) have "length xs > 0" by auto + then have eq: "hd xs = e_hd (e2xs ?e)" + using assms e_hd_def by auto + have "step c = ((Pr n f g, xs, (the rv) # ls) # fs, None)" + (is "step c = (?t # ?ss, None)") + using assms by simp + then have "encode_config (step c) = + prod_encode (list_encode (map encode_frame (?t # ?ss)), 0)" + using encode_config by simp + also have "... = + prod_encode (e_cons (encode_frame ?t) (list_encode (map encode_frame (?ss))), 0)" + by simp + also have "... = prod_encode (e_cons (encode_frame ?t) (e2tail ?e), 0)" + using assms(1) by simp + also have "... = prod_encode + (e_cons + (triple_encode (e2i ?e) (e2xs ?e) (e_cons (e2rv ?e - 1) (e2ls ?e))) + (e2tail ?e), + 0)" + by (simp add: assms encode_frame) + finally show ?thesis + using assms eq estep_Pr_def by auto +qed + +lemma estep_Pr2: + assumes "c = (((Pr n f g, xs, ls) # fs), rv)" + and "ls \ []" + and "length ls \ Suc (hd xs)" + and "rv = None" + and "recfn (length xs) (Pr n f g)" + shows "estep_Pr (encode_config c) = encode_config (step c)" +proof - + let ?e = "encode_config c" + from assms(5) have "length xs > 0" by auto + then have eq: "hd xs = e_hd (e2xs ?e)" + using assms e_hd_def by auto + have "step c = ((g, (length ls - 1) # hd ls # tl xs, []) # (Pr n f g, xs, ls) # fs, None)" + (is "step c = (?t # ?ss, None)") + using assms by simp + then have "encode_config (step c) = + prod_encode (list_encode (map encode_frame (?t # ?ss)), 0)" + using encode_config by simp + also have "... = + prod_encode (e_cons (encode_frame ?t) (list_encode (map encode_frame (?ss))), 0)" + by simp + also have "... = prod_encode (e_cons (encode_frame ?t) (e2stack ?e), 0)" + using assms(1) by simp + also have "... 
= prod_encode + (e_cons + (triple_encode + (pdec222 (e2i ?e)) + (e_cons (e2lenls ?e - 1) (e_cons (e_hd (e2ls ?e)) (e_tl (e2xs ?e)))) + 0) + (e2stack ?e), + 0)" + using assms(1,2) encode_frame[of g "(length ls - 1) # hd ls # tl xs" "[]"] + pdec2_encode_Pr[of n f g] e2xs_xs e2i_f e2lenls_lenls e2ls_ls e_hd + by (metis list_encode.simps(1) list.collapse list_decode_encode + prod_encode_inverse snd_conv) + finally show ?thesis + using assms eq estep_Pr_def by auto +qed + +lemma estep_Pr3: + assumes "c = (((Pr n f g, xs, ls) # fs), rv)" + and "ls \ []" + and "length ls = Suc (hd xs)" + and "recfn (length xs) (Pr n f g)" + shows "estep_Pr (encode_config c) = encode_config (step c)" +proof - + let ?e = "encode_config c" + from assms(4) have "length xs > 0" by auto + then have "hd xs = e_hd (e2xs ?e)" + using assms e_hd_def by auto + then have "(length ls = Suc (hd xs)) = (e2lenls ?e = Suc (e_hd (e2xs ?e)))" + using assms by simp + then have *: "estep_Pr ?e = prod_encode (e2tail ?e, Suc (e_hd (e2ls ?e)))" + using assms estep_Pr_def by auto + have "step c = (fs, Some (hd ls))" + using assms(1,2,3) by simp + then have "encode_config (step c) = + prod_encode (list_encode (map encode_frame fs), encode_option (Some (hd ls)))" + using encode_config by simp + also have "... = + prod_encode (list_encode (map encode_frame fs), encode_option (Some (e_hd (e2ls ?e))))" + using assms(1,2) e_hd_def by auto + also have "... = prod_encode (list_encode (map encode_frame fs), Suc (e_hd (e2ls ?e)))" + by simp + also have "... = prod_encode (e2tail ?e, Suc (e_hd (e2ls ?e)))" + using assms(1) by simp + finally have "encode_config (step c) = prod_encode (e2tail ?e, Suc (e_hd (e2ls ?e)))" . + then show ?thesis + using estep_Pr_def * by presburger +qed + +lemma estep_Pr4: + assumes "c = (((Pr n f g, xs, ls) # fs), rv)" and "ls = []" + shows "estep_Pr (encode_config c) = encode_config (step c)" + using encode_frame + by (simp add: assms estep_Pr_def, simp add: encode_config assms) + +lemma estep_Pr: + assumes "c = (((Pr n f g, xs, ls) # fs), rv)" + and "recfn (length xs) (Pr n f g)" + shows "estep_Pr (encode_config c) = encode_config (step c)" + using assms estep_Pr1 estep_Pr2 estep_Pr3 estep_Pr4 by simp + +definition "estep_Mn e \ + if e2ls e = 0 + then prod_encode + (e_cons + (triple_encode (pdec22 (e2i e)) (e_cons 0 (e2xs e)) 0) + (e_cons + (triple_encode (e2i e) (e2xs e) (singleton_encode 0)) + (e2tail e)), + 0) + else if e2rv e = 1 + then prod_encode (e2tail e, Suc (e_hd (e2ls e))) + else prod_encode + (e_cons + (triple_encode (pdec22 (e2i e)) (e_cons (Suc (e_hd (e2ls e))) (e2xs e)) 0) + (e_cons + (triple_encode (e2i e) (e2xs e) (singleton_encode (Suc (e_hd (e2ls e))))) + (e2tail e)), + 0)" + +lemma estep_Mn: + assumes "c = (((Mn n f, xs, ls) # fs), rv)" + shows "estep_Mn (encode_config c) = encode_config (step c)" +proof - + let ?e = "encode_config c" + consider "ls \ []" and "rv \ Some 0" | "ls \ []" and "rv = Some 0" | "ls = []" + by auto + then show ?thesis + proof (cases) + case 1 + then have step_c: "step c = + ((f, (Suc (hd ls)) # xs, []) # (Mn n f, xs, [Suc (hd ls)]) # fs, None)" + (is "step c = ?cfg") + using assms by simp + have "estep_Mn ?e = + prod_encode + (e_cons + (triple_encode (encode f) (e_cons (Suc (hd ls)) (list_encode xs)) 0) + (e_cons + (triple_encode (encode (Mn n f)) (list_encode xs) (singleton_encode (Suc (hd ls)))) + (list_encode (map encode_frame fs))), + 0)" + using 1 assms e_hd_def estep_Mn_def by auto + also have "... 
= encode_config ?cfg" + using encode_config by (simp add: encode_frame) + finally show ?thesis + using step_c by simp + next + case 2 + have "estep_Mn ?e = prod_encode (e2tail ?e, Suc (e_hd (e2ls ?e)))" + using 2 assms estep_Mn_def by auto + also have "... = prod_encode (e2tail ?e, Suc (hd ls))" + using 2 assms e_hd_def by auto + also have "... = prod_encode (list_encode (map encode_frame fs), Suc (hd ls))" + using assms by simp + also have "... = encode_config (fs, Some (hd ls))" + using encode_config by simp + finally show ?thesis + using 2 assms by simp + next + case 3 + then show ?thesis + using assms encode_frame by (simp add: estep_Mn_def, simp add: encode_config) + qed +qed + +definition "estep e \ + if e2stack e = 0 then prod_encode (0, e2rv e) + else if e2i e = 0 then prod_encode (e2tail e, 1) + else if e2i e = 1 then prod_encode (e2tail e, Suc (Suc (e_hd (e2xs e)))) + else if encode_kind (e2i e) = 2 then + prod_encode (e2tail e, Suc (e_nth (e2xs e) (pdec22 (e2i e)))) + else if encode_kind (e2i e) = 3 then estep_Cn e + else if encode_kind (e2i e) = 4 then estep_Pr e + else if encode_kind (e2i e) = 5 then estep_Mn e + else 0" + +lemma estep_Z: + assumes "c = (((Z, xs, ls) # fs), rv)" + shows "estep (encode_config c) = encode_config (step c)" + using encode_frame by (simp add: assms estep_def, simp add: encode_config assms) + +lemma estep_S: + assumes "c = (((S, xs, ls) # fs), rv)" + and "recfn (length xs) (fst (hd (fst c)))" + shows "estep (encode_config c) = encode_config (step c)" +proof - + let ?e = "encode_config c" + from assms have "length xs > 0" by auto + then have eq: "hd xs = e_hd (e2xs ?e)" + using assms(1) e_hd_def by auto + then have "estep ?e = prod_encode (e2tail ?e, Suc (Suc (e_hd (e2xs ?e))))" + using assms(1) estep_def by simp + moreover have "step c = (fs, Some (Suc (hd xs)))" + using assms(1) by simp + ultimately show ?thesis + using assms(1) eq estep_def encode_config[of fs "Some (Suc (hd xs))"] by simp +qed + +lemma estep_Id: + assumes "c = (((Id m n, xs, ls) # fs), rv)" + and "recfn (length xs) (fst (hd (fst c)))" + shows "estep (encode_config c) = encode_config (step c)" +proof - + let ?e = "encode_config c" + from assms have "length xs = m" and "m > 0" by auto + then have eq: "xs ! n = e_nth (e2xs ?e) n" + using assms e_hd_def by auto + moreover have "encode_kind (e2i ?e) = 2" + using assms(1) encode_kind_2 by auto + ultimately have "estep ?e = + prod_encode (e2tail ?e, Suc (e_nth (e2xs ?e) (pdec22 (e2i ?e))))" + using assms estep_def encode_kind_def by auto + moreover have "step c = (fs, Some (xs ! n))" + using assms(1) by simp + ultimately show ?thesis + using assms(1) eq encode_config[of fs "Some (xs ! 
n)"] by simp +qed + +lemma estep: + assumes "valid (fst c)" + shows "estep (encode_config c) = encode_config (step c)" +proof (cases "fst c") + case Nil + then show ?thesis + using estep_def + by (metis list_encode.simps(1) e2rv_def e2stack_stack encode_config_def + map_is_Nil_conv prod.collapse prod_encode_inverse snd_conv step.simps(1)) +next + case (Cons s fs) + then obtain f xs ls rv where c: "c = ((f, xs, ls) # fs, rv)" + by (metis prod.exhaust_sel) + with assms valid_def have lenas: "recfn (length xs) f" by simp + show ?thesis + proof (cases f) + case Z + then show ?thesis using estep_Z c by simp + next + case S + then show ?thesis using estep_S c lenas by simp + next + case Id + then show ?thesis using estep_Id c lenas by simp + next + case Cn + then show ?thesis + using estep_Cn c + by (metis e2i_f e2stack_0_iff_Nil encode.simps(1) encode.simps(2) encode_kind_2 + encode_kind_3 encode_kind_Cn estep_def list.distinct(1) recf.distinct(13) + recf.distinct(19) recf.distinct(5)) + next + case Pr + then show ?thesis + using estep_Pr c lenas + by (metis e2i_f e2stack_0_iff_Nil encode.simps(1) encode.simps(2) encode_kind_2 + encode_kind_4 encode_kind_Cn encode_kind_Pr estep_def list.distinct(1) recf.distinct(15) + recf.distinct(21) recf.distinct(25) recf.distinct(7)) + next + case Mn + then show ?thesis + using estep_Pr c lenas + by (metis (no_types, lifting) e2i_f e2stack_0_iff_Nil encode.simps(1) + encode.simps(2) encode_kind_2 encode_kind_5 encode_kind_Cn encode_kind_Mn encode_kind_Pr + estep_Mn estep_def list.distinct(1) recf.distinct(17) recf.distinct(23) + recf.distinct(27) recf.distinct(9)) + qed +qed + +subsection \The step function as a partial recursive function\label{s:step_recf}\ + +text \In this section we construct a primitive recursive function +@{term r_step} computing @{term estep}. 
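+In other words, we seek a primitive recursive function that maps the
+encoding of every valid configuration $c$ to the encoding of
+$\mathit{step}(c)$ (this is theorem \emph{r\_step\_equiv\_step} below).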
This will entail defining @{typ +recf}s for many functions defined in the previous section.\ + +definition "r_e2stack \ r_pdec1" + +lemma r_e2stack_prim: "prim_recfn 1 r_e2stack" + unfolding r_e2stack_def using r_pdec1_prim by simp + +lemma r_e2stack [simp]: "eval r_e2stack [e] \= e2stack e" + unfolding r_e2stack_def e2stack_def using r_pdec1_prim by simp + +definition "r_e2rv \ r_pdec2" + +lemma r_e2rv_prim: "prim_recfn 1 r_e2rv" + unfolding r_e2rv_def using r_pdec2_prim by simp + +lemma r_e2rv [simp]: "eval r_e2rv [e] \= e2rv e" + unfolding r_e2rv_def e2rv_def using r_pdec2_prim by simp + +definition "r_e2tail \ Cn 1 r_tl [r_e2stack]" + +lemma r_e2tail_prim: "prim_recfn 1 r_e2tail" + unfolding r_e2tail_def using r_e2stack_prim r_tl_prim by simp + +lemma r_e2tail [simp]: "eval r_e2tail [e] \= e2tail e" + unfolding r_e2tail_def e2tail_def using r_e2stack_prim r_tl_prim by simp + +definition "r_e2frame \ Cn 1 r_hd [r_e2stack]" + +lemma r_e2frame_prim: "prim_recfn 1 r_e2frame" + unfolding r_e2frame_def using r_hd_prim r_e2stack_prim by simp + +lemma r_e2frame [simp]: "eval r_e2frame [e] \= e2frame e" + unfolding r_e2frame_def e2frame_def using r_hd_prim r_e2stack_prim by simp + +definition "r_e2i \ Cn 1 r_pdec1 [r_e2frame]" + +lemma r_e2i_prim: "prim_recfn 1 r_e2i" + unfolding r_e2i_def using r_pdec12_prim r_e2frame_prim by simp + +lemma r_e2i [simp]: "eval r_e2i [e] \= e2i e" + unfolding r_e2i_def e2i_def using r_pdec12_prim r_e2frame_prim by simp + +definition "r_e2xs \ Cn 1 r_pdec12 [r_e2frame]" + +lemma r_e2xs_prim: "prim_recfn 1 r_e2xs" + unfolding r_e2xs_def using r_pdec122_prim r_e2frame_prim by simp + +lemma r_e2xs [simp]: "eval r_e2xs [e] \= e2xs e" + unfolding r_e2xs_def e2xs_def using r_pdec122_prim r_e2frame_prim by simp + +definition "r_e2ls \ Cn 1 r_pdec22 [r_e2frame]" + +lemma r_e2ls_prim: "prim_recfn 1 r_e2ls" + unfolding r_e2ls_def using r_pdec222_prim r_e2frame_prim by simp + +lemma r_e2ls [simp]: "eval r_e2ls [e] \= e2ls e" + unfolding r_e2ls_def e2ls_def using r_pdec222_prim r_e2frame_prim by simp + +definition "r_e2lenls \ Cn 1 r_length [r_e2ls]" + +lemma r_e2lenls_prim: "prim_recfn 1 r_e2lenls" + unfolding r_e2lenls_def using r_length_prim r_e2ls_prim by simp + +lemma r_e2lenls [simp]: "eval r_e2lenls [e] \= e2lenls e" + unfolding r_e2lenls_def e2lenls_def using r_length_prim r_e2ls_prim by simp + +definition "r_kind \ + Cn 1 r_ifz [Id 1 0, Z, Cn 1 r_ifeq [Id 1 0, r_const 1, r_const 1, r_pdec1]]" + +lemma r_kind_prim: "prim_recfn 1 r_kind" + unfolding r_kind_def by simp + +lemma r_kind: "eval r_kind [e] \= encode_kind e" + unfolding r_kind_def encode_kind_def by simp + +lemmas helpers_for_r_step_prim = + r_e2i_prim + r_e2lenls_prim + r_e2ls_prim + r_e2rv_prim + r_e2xs_prim + r_e2stack_prim + r_e2tail_prim + r_e2frame_prim + +text \We define primitive recursive functions @{term r_step_Id}, @{term +r_step_Cn}, @{term r_step_Pr}, and @{term r_step_Mn}. 
The last three +correspond to @{term estep_Cn}, @{term estep_Pr}, and @{term estep_Mn} from +the previous section.\ + +definition "r_step_Id \ + Cn 1 r_prod_encode [r_e2tail, Cn 1 S [Cn 1 r_nth [r_e2xs, Cn 1 r_pdec22 [r_e2i]]]]" + +lemma r_step_Id: + "eval r_step_Id [e] \= prod_encode (e2tail e, Suc (e_nth (e2xs e) (pdec22 (e2i e))))" + unfolding r_step_Id_def using helpers_for_r_step_prim by simp + +abbreviation r_triple_encode :: "recf \ recf \ recf \ recf" where + "r_triple_encode x y z \ Cn 1 r_prod_encode [x, Cn 1 r_prod_encode [y, z]]" + +definition "r_step_Cn \ + Cn 1 r_ifeq + [r_e2lenls, + Cn 1 r_length [Cn 1 r_pdec222 [r_e2i]], + Cn 1 r_ifz + [r_e2rv, + Cn 1 r_prod_encode + [Cn 1 r_cons [r_triple_encode (Cn 1 r_pdec122 [r_e2i]) r_e2ls Z, r_e2stack], + Z], + Cn 1 r_prod_encode [r_e2tail, r_e2rv]], + Cn 1 r_ifz + [r_e2rv, + Cn 1 r_ifless + [r_e2lenls, + Cn 1 r_length [Cn 1 r_pdec222 [r_e2i]], + Cn 1 r_prod_encode + [Cn 1 r_cons + [r_triple_encode (Cn 1 r_nth [Cn 1 r_pdec222 [r_e2i], r_e2lenls]) r_e2xs Z, + r_e2stack], + Z], + Cn 1 r_prod_encode [r_e2tail, r_e2rv]], + Cn 1 r_prod_encode + [Cn 1 r_cons + [r_triple_encode r_e2i r_e2xs (Cn 1 r_snoc [r_e2ls, Cn 1 r_dec [r_e2rv]]), + r_e2tail], + Z]]]" + +lemma r_step_Cn_prim: "prim_recfn 1 r_step_Cn" + unfolding r_step_Cn_def using helpers_for_r_step_prim by simp + +lemma r_step_Cn: "eval r_step_Cn [e] \= estep_Cn e" + unfolding r_step_Cn_def estep_Cn_def using helpers_for_r_step_prim by simp + +definition "r_step_Pr \ + Cn 1 r_ifz + [r_e2ls, + Cn 1 r_ifz + [r_e2rv, + Cn 1 r_prod_encode + [Cn 1 r_cons + [r_triple_encode (Cn 1 r_pdec122 [r_e2i]) (Cn 1 r_tl [r_e2xs]) Z, + r_e2stack], + Z], + Cn 1 r_prod_encode + [Cn 1 r_cons + [r_triple_encode r_e2i r_e2xs (Cn 1 r_singleton_encode [Cn 1 r_dec [r_e2rv]]), + r_e2tail], + Z]], + Cn 1 r_ifeq + [r_e2lenls, + Cn 1 S [Cn 1 r_hd [r_e2xs]], + Cn 1 r_prod_encode [r_e2tail, Cn 1 S [Cn 1 r_hd [r_e2ls]]], + Cn 1 r_ifz + [r_e2rv, + Cn 1 r_prod_encode + [Cn 1 r_cons + [r_triple_encode + (Cn 1 r_pdec222 [r_e2i]) + (Cn 1 r_cons + [Cn 1 r_dec [r_e2lenls], + Cn 1 r_cons [Cn 1 r_hd [r_e2ls], + Cn 1 r_tl [r_e2xs]]]) + Z, + r_e2stack], + Z], + Cn 1 r_prod_encode + [Cn 1 r_cons + [r_triple_encode r_e2i r_e2xs (Cn 1 r_cons [Cn 1 r_dec [r_e2rv], r_e2ls]), + r_e2tail], + Z]]]]" + +lemma r_step_Pr_prim: "prim_recfn 1 r_step_Pr" + unfolding r_step_Pr_def using helpers_for_r_step_prim by simp + +lemma r_step_Pr: "eval r_step_Pr [e] \= estep_Pr e" + unfolding r_step_Pr_def estep_Pr_def using helpers_for_r_step_prim by simp + +definition "r_step_Mn \ + Cn 1 r_ifz + [r_e2ls, + Cn 1 r_prod_encode + [Cn 1 r_cons + [r_triple_encode (Cn 1 r_pdec22 [r_e2i]) (Cn 1 r_cons [Z, r_e2xs]) Z, + Cn 1 r_cons + [r_triple_encode r_e2i r_e2xs (Cn 1 r_singleton_encode [Z]), + r_e2tail]], + Z], + Cn 1 r_ifeq + [r_e2rv, + r_const 1, + Cn 1 r_prod_encode [r_e2tail, Cn 1 S [Cn 1 r_hd [r_e2ls]]], + Cn 1 r_prod_encode + [Cn 1 r_cons + [r_triple_encode + (Cn 1 r_pdec22 [r_e2i]) + (Cn 1 r_cons [Cn 1 S [Cn 1 r_hd [r_e2ls]], r_e2xs]) + Z, + Cn 1 r_cons + [r_triple_encode r_e2i r_e2xs (Cn 1 r_singleton_encode [Cn 1 S [Cn 1 r_hd [r_e2ls]]]), + r_e2tail]], + Z]]]" + +lemma r_step_Mn_prim: "prim_recfn 1 r_step_Mn" + unfolding r_step_Mn_def using helpers_for_r_step_prim by simp + +lemma r_step_Mn: "eval r_step_Mn [e] \= estep_Mn e" + unfolding r_step_Mn_def estep_Mn_def using helpers_for_r_step_prim by simp + +definition "r_step \ + Cn 1 r_ifz + [r_e2stack, + Cn 1 r_prod_encode [Z, r_e2rv], + Cn 1 r_ifz + [r_e2i, + Cn 1 r_prod_encode [r_e2tail, r_const 
1], + Cn 1 r_ifeq + [r_e2i, + r_const 1, + Cn 1 r_prod_encode [r_e2tail, Cn 1 S [Cn 1 S [Cn 1 r_hd [r_e2xs]]]], + Cn 1 r_ifeq + [Cn 1 r_kind [r_e2i], + r_const 2, + Cn 1 r_prod_encode [r_e2tail, Cn 1 S [Cn 1 r_nth [r_e2xs, Cn 1 r_pdec22 [r_e2i]]]], + Cn 1 r_ifeq + [Cn 1 r_kind [r_e2i], + r_const 3, + r_step_Cn, + Cn 1 r_ifeq + [Cn 1 r_kind [r_e2i], + r_const 4, + r_step_Pr, + Cn 1 r_ifeq + [Cn 1 r_kind [r_e2i], r_const 5, r_step_Mn, Z]]]]]]]" + +lemma r_step_prim: "prim_recfn 1 r_step" + unfolding r_step_def + using r_kind_prim r_step_Mn_prim r_step_Pr_prim r_step_Cn_prim helpers_for_r_step_prim + by simp + +lemma r_step: "eval r_step [e] \= estep e" + unfolding r_step_def estep_def + using r_kind_prim r_step_Mn_prim r_step_Pr_prim r_step_Cn_prim helpers_for_r_step_prim + r_kind r_step_Cn r_step_Pr r_step_Mn + by simp + +theorem r_step_equiv_step: + assumes "valid (fst c)" + shows "eval r_step [encode_config c] \= encode_config (step c)" + using r_step estep assms by simp + + +subsection \The universal function\label{s:the_universal}\ + +text \The next function computes the configuration after arbitrarily +many steps.\ + +definition "r_leap \ + Pr 2 + (Cn 2 r_prod_encode + [Cn 2 r_singleton_encode + [Cn 2 r_prod_encode [Id 2 0, Cn 2 r_prod_encode [Id 2 1, r_constn 1 0]]], + r_constn 1 0]) + (Cn 4 r_step [Id 4 1])" + +lemma r_leap_prim [simp]: "prim_recfn 3 r_leap" + unfolding r_leap_def using r_step_prim by simp + +lemma r_leap_total: "eval r_leap [t, i, x] \" + using prim_recfn_total[OF r_leap_prim] by simp + +lemma r_leap: + assumes "i = encode f" and "recfn (e_length x) f" + shows "eval r_leap [t, i, x] \= encode_config (iterate t step ([(f, list_decode x, [])], None))" +proof (induction t) + case 0 + then show ?case + unfolding r_leap_def using r_step_prim assms encode_config encode_frame by simp +next + case (Suc t) + let ?c = "([(f, list_decode x, [])], None)" + let ?tc = "iterate t step ?c" + have "valid (fst ?c)" + using valid_def assms by simp + then have valid: "valid (fst ?tc)" + using iterate_step_valid by simp + have "eval r_leap [Suc t, i, x] = + eval (Cn 4 r_step [Id 4 1]) [t, the (eval r_leap [t, i, x]), i, x]" + unfolding r_leap_def using eval_Pr_prim_Suc r_step_prim assms by simp + then have "eval r_leap [Suc t, i, x] = eval (Cn 4 r_step [Id 4 1]) [t, encode_config ?tc, i, x]" + using Suc by simp + then have "eval r_leap [Suc t, i, x] = eval r_step [encode_config ?tc]" + using r_step_prim by simp + then have "eval r_leap [Suc t, i, x] \= encode_config (step ?tc)" + by (simp add: r_step_equiv_step valid) + then show ?case by simp +qed + +lemma step_leaves_empty_stack_empty: + assumes "iterate t step ([(f, list_decode x, [])], None) = ([], Some v)" + shows "iterate (t + t') step ([(f, list_decode x, [])], None) = ([], Some v)" + using assms by (induction t') simp_all + +text \The next function is essentially a convenience wrapper around +@{term r_leap}. 
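+(Recall that for a suitable code $i$ and encoded argument list $x$ the
+value of @{term r_leap} at $t$, $i$, $x$ encodes the configuration reached
+after $t$ steps of the simulated computation.)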
It returns zero if the configuration returned by @{term +r_leap} is non-final, and @{term "Suc v"} if the configuration is final with +return value $v$.\ + +definition "r_result \ + Cn 3 r_ifz [Cn 3 r_pdec1 [r_leap], Cn 3 r_pdec2 [r_leap], r_constn 2 0]" + +lemma r_result_prim [simp]: "prim_recfn 3 r_result" + unfolding r_result_def using r_leap_prim by simp + +lemma r_result_total: "total r_result" + using r_result_prim by blast + +lemma r_result_empty_stack_None: + assumes "i = encode f" + and "recfn (e_length x) f" + and "iterate t step ([(f, list_decode x, [])], None) = ([], None)" + shows "eval r_result [t, i, x] \= 0" + unfolding r_result_def + using assms r_leap e2stack_0_iff_Nil e2stack_def e2stack_stack r_leap_total r_leap_prim + e2rv_def e2rv_rv + by simp + +lemma r_result_empty_stack_Some: + assumes "i = encode f" + and "recfn (e_length x) f" + and "iterate t step ([(f, list_decode x, [])], None) = ([], Some v)" + shows "eval r_result [t, i, x] \= Suc v" + unfolding r_result_def + using assms r_leap e2stack_0_iff_Nil e2stack_def e2stack_stack r_leap_total r_leap_prim + e2rv_def e2rv_rv + by simp + +lemma r_result_empty_stack_stays: + assumes "i = encode f" + and "recfn (e_length x) f" + and "iterate t step ([(f, list_decode x, [])], None) = ([], Some v)" + shows "eval r_result [t + t', i, x] \= Suc v" + using assms step_leaves_empty_stack_empty r_result_empty_stack_Some by simp + +lemma r_result_nonempty_stack: + assumes "i = encode f" + and "recfn (e_length x) f" + and "fst (iterate t step ([(f, list_decode x, [])], None)) \ []" + shows "eval r_result [t, i, x] \= 0" +proof - + obtain ss rv where "iterate t step ([(f, list_decode x, [])], None) = (ss, rv)" + by fastforce + moreover from this assms(3) have "ss \ []" by simp + ultimately have "eval r_leap [t, i, x] \= encode_config (ss, rv)" + using assms r_leap by simp + then have "eval (Cn 3 r_pdec1 [r_leap]) [t, i, x] \\ 0" + using `ss \ []` r_leap_prim encode_config r_leap_total list_encode_0 + by (auto, blast) + then show ?thesis unfolding r_result_def using r_leap_prim by auto +qed + +lemma r_result_Suc: + assumes "i = encode f" + and "recfn (e_length x) f" + and "eval r_result [t, i, x] \= Suc v" + shows "iterate t step ([(f, list_decode x, [])], None) = ([], Some v)" + (is "?cfg = _") +proof (cases "fst ?cfg") + case Nil + then show ?thesis + using assms r_result_empty_stack_None r_result_empty_stack_Some + by (metis Zero_not_Suc nat.inject option.collapse option.inject prod.exhaust_sel) +next + case Cons + then show ?thesis using assms r_result_nonempty_stack by simp +qed + +lemma r_result_converg: + assumes "i = encode f" + and "recfn (e_length x) f" + and "eval f (list_decode x) \= v" + shows "\t. + (\t'\t. eval r_result [t', i, x] \= Suc v) \ + (\t'= 0)" +proof - + let ?xs = "list_decode x" + let ?stack = "[(f, ?xs, [])]" + have "wellf f" using assms(2) by simp + moreover have "length ?xs = arity f" + using assms(2) by simp + ultimately have "correct (?stack, None)" + using step_correct valid_def by simp + with assms(3) have "reachable (?stack, None) ([], Some v)" + by simp + then obtain t where + "iterate t step (?stack, None) = ([], Some v)" + "\t' []" + using reachable_iterate_step_empty_stack by blast + then have t: + "eval r_result [t, i, x] \= Suc v" + "\t'= 0" + using r_result_empty_stack_Some r_result_nonempty_stack assms(1,2) + by simp_all + then have "eval r_result [t + t', i, x] \= Suc v" for t' + using r_result_empty_stack_stays assms r_result_Suc by simp + then have "\t'\t. 
eval r_result [t', i, x] \= Suc v" + using le_Suc_ex by blast + with t(2) show ?thesis by auto +qed + +lemma r_result_diverg: + assumes "i = encode f" + and "recfn (e_length x) f" + and "eval f (list_decode x) \" + shows "eval r_result [t, i, x] \= 0" +proof - + let ?xs = "list_decode x" + let ?stack = "[(f, ?xs, [])]" + have "recfn (length ?xs) f" + using assms(2) by auto + then have "correct (?stack, None)" + using step_correct valid_def by simp + with assms(3) have "nonterminating (?stack, None)" + by simp + then show ?thesis + using r_result_nonempty_stack assms(1,2) by simp +qed + +text \Now we can define the universal partial recursive function. This +function executes @{term r_result} for increasing time bounds, waits for it +to reach a final configuration, and then extracts its result value. If no +final configuration is reached, the universal function diverges.\ + +definition "r_univ \ + Cn 2 r_dec [Cn 2 r_result [Mn 2 (Cn 3 r_not [r_result]), Id 2 0, Id 2 1]]" + +lemma r_univ_recfn [simp]: "recfn 2 r_univ" + unfolding r_univ_def by simp + +theorem r_univ: + assumes "i = encode f" and "recfn (e_length x) f" + shows "eval r_univ [i, x] = eval f (list_decode x)" +proof - + let ?cond = "Cn 3 r_not [r_result]" + let ?while = "Mn 2 ?cond" + let ?res = "Cn 2 r_result [?while, Id 2 0, Id 2 1]" + let ?xs = "list_decode x" + have *: "eval ?cond [t, i, x] \= (if eval r_result [t, i, x] \= 0 then 1 else 0)" for t + proof - + have "eval ?cond [t, i, x] = eval r_not [the (eval r_result [t, i, x])]" + using r_result_total by simp + moreover have "eval r_result [t, i, x] \" + by (simp add: r_result_total) + ultimately show ?thesis by auto + qed + show ?thesis + proof (cases "eval f ?xs \") + case True + then show ?thesis + unfolding r_univ_def using * r_result_diverg[OF assms] eval_Mn_diverg by simp + next + case False + then obtain v where v: "eval f ?xs \= v" by auto + then obtain t where t: + "\t'\t. eval r_result [t', i, x] \= Suc v" + "\t'= 0" + using r_result_converg[OF assms] by blast + then have + "\t'\t. eval ?cond [t', i, x] \= 0" + "\t'= 1" + using * by simp_all + then have "eval ?while [i, x] \= t" + using eval_Mn_convergI[of 2 ?cond "[i, x]" t] by simp + then have "eval ?res [i, x] = eval r_result [t, i, x]" + by simp + then have "eval ?res [i, x] \= Suc v" + using t(1) by simp + then show ?thesis + unfolding r_univ_def using v by simp + qed +qed + +theorem r_univ': + assumes "recfn (e_length x) f" + shows "eval r_univ [encode f, x] = eval f (list_decode x)" + using r_univ assms by simp + +text \Universal functions for every arity can be built from @{term "r_univ"}.\ + +definition r_universal :: "nat \ recf" where + "r_universal n \ Cn (Suc n) r_univ [Id (Suc n) 0, r_shift (r_list_encode (n - 1))]" + +lemma r_universal_recfn [simp]: "n > 0 \ recfn (Suc n) (r_universal n)" + unfolding r_universal_def by simp + +lemma r_universal: + assumes "recfn n f" and "length xs = n" + shows "eval (r_universal n) (encode f # xs) = eval f xs" + unfolding r_universal_def using wellf_arity_nonzero assms r_list_encode r_univ' + by fastforce + +text \We will mostly be concerned with computing unary functions. 
Hence +we introduce separate functions for this case.\ + +definition "r_result1 \ + Cn 3 r_result [Id 3 0, Id 3 1, Cn 3 r_singleton_encode [Id 3 2]]" + +lemma r_result1_prim [simp]: "prim_recfn 3 r_result1" + unfolding r_result1_def by simp + +lemma r_result1_total: "total r_result1" + using Mn_free_imp_total by simp + +lemma r_result1 [simp]: + "eval r_result1 [t, i, x] = eval r_result [t, i, singleton_encode x]" + unfolding r_result1_def by simp + +text \The following function will be our standard Gödel numbering +of all unary partial recursive functions.\ + +definition "r_phi \ r_universal 1" + +lemma r_phi_recfn [simp]: "recfn 2 r_phi" + unfolding r_phi_def by simp + +theorem r_phi: + assumes "i = encode f" and "recfn 1 f" + shows "eval r_phi [i, x] = eval f [x]" + unfolding r_phi_def using r_universal assms by simp + +corollary r_phi': + assumes "recfn 1 f" + shows "eval r_phi [encode f, x] = eval f [x]" + using assms r_phi by simp + +lemma r_phi'': "eval r_phi [i, x] = eval r_univ [i, singleton_encode x]" + unfolding r_universal_def r_phi_def using r_list_encode by simp + + +section \Applications of the universal function\ + +text \In this section we shall see some ways @{term r_univ} and @{term r_result} can +be used.\ + +subsection \Lazy conditional evaluation\ + +text \With the help of @{term r_univ} we can now define a +\hypertarget{p:r_lifz}{lazy variant} of @{term r_ifz}, in which only one +branch is evaluated.\ + +definition r_lazyifzero :: "nat \ nat \ nat \ recf" where + "r_lazyifzero n j\<^sub>1 j\<^sub>2 \ + Cn (Suc (Suc n)) r_univ + [Cn (Suc (Suc n)) r_ifz [Id (Suc (Suc n)) 0, r_constn (Suc n) j\<^sub>1, r_constn (Suc n) j\<^sub>2], + r_shift (r_list_encode n)]" + +lemma r_lazyifzero_recfn: "recfn (Suc (Suc n)) (r_lazyifzero n j\<^sub>1 j\<^sub>2)" + using r_lazyifzero_def by simp + +lemma r_lazyifzero: + assumes "length xs = Suc n" + and "j\<^sub>1 = encode f\<^sub>1" + and "j\<^sub>2 = encode f\<^sub>2" + and "recfn (Suc n) f\<^sub>1" + and "recfn (Suc n) f\<^sub>2" + shows "eval (r_lazyifzero n j\<^sub>1 j\<^sub>2) (c # xs) = (if c = 0 then eval f\<^sub>1 xs else eval f\<^sub>2 xs)" +proof - + let ?a = "r_constn (Suc n) n" + let ?b = "Cn (Suc (Suc n)) r_ifz + [Id (Suc (Suc n)) 0, r_constn (Suc n) j\<^sub>1, r_constn (Suc n) j\<^sub>2]" + let ?c = "r_shift (r_list_encode n)" + have "eval ?a (c # xs) \= n" + using assms(1) by simp + moreover have "eval ?b (c # xs) \= (if c = 0 then j\<^sub>1 else j\<^sub>2)" + using assms(1) by simp + moreover have "eval ?c (c # xs) \= list_encode xs" + using assms(1) r_list_encode r_shift by simp + ultimately have "eval (r_lazyifzero n j\<^sub>1 j\<^sub>2) (c # xs) = + eval r_univ [if c = 0 then j\<^sub>1 else j\<^sub>2, list_encode xs]" + unfolding r_lazyifzero_def using r_lazyifzero_recfn assms(1) by simp + then show ?thesis using assms r_univ by simp +qed + +definition r_lifz :: "recf \ recf \ recf" where + "r_lifz f g \ r_lazyifzero (arity f - 1) (encode f) (encode g)" + +lemma r_lifz_recfn [simp]: + assumes "recfn n f" and "recfn n g" + shows "recfn (Suc n) (r_lifz f g)" + using assms r_lazyifzero_recfn r_lifz_def wellf_arity_nonzero by auto + +lemma r_lifz [simp]: + assumes "length xs = n" and "recfn n f" and "recfn n g" + shows "eval (r_lifz f g) (c # xs) = (if c = 0 then eval f xs else eval g xs)" + using assms r_lazyifzero r_lifz_def wellf_arity_nonzero + by (metis One_nat_def Suc_pred) + + +subsection \Enumerating the domains of partial recursive functions\ + +text \In this section we define a binary function 
$\mathit{enumdom}$ +such that for all $i$, the domain of $\varphi_i$ equals +$\{\mathit{enumdom}(i, x) \mid \mathit{enumdom}(i, x)\!\downarrow\}$. In +other words, the image of $\mathit{enumdom}_i$ is the domain of $\varphi_i$. + +First we need some more properties of @{term r_leap} and @{term r_result}.\ + +lemma r_leap_Suc: "eval r_leap [Suc t, i, x] = eval r_step [the (eval r_leap [t, i, x])]" +proof - + have "eval r_leap [Suc t, i, x] = + eval (Cn 4 r_step [Id 4 1]) [t, the (eval r_leap [t, i, x]), i, x]" + using r_leap_total eval_Pr_converg_Suc r_leap_def + by (metis length_Cons list.size(3) numeral_2_eq_2 numeral_3_eq_3 r_leap_prim) + then show ?thesis using r_step_prim by auto +qed + +lemma r_leap_Suc_saturating: + assumes "pdec1 (the (eval r_leap [t, i, x])) = 0" + shows "eval r_leap [Suc t, i, x] = eval r_leap [t, i, x]" +proof - + let ?e = "eval r_leap [t, i, x]" + have "eval r_step [the ?e] \= estep (the ?e)" + using r_step by simp + then have "eval r_step [the ?e] \= prod_encode (0, e2rv (the ?e))" + using estep_def assms by (simp add: e2stack_def) + then have "eval r_step [the ?e] \= prod_encode (pdec1 (the ?e), pdec2 (the ?e))" + using assms by (simp add: e2rv_def) + then have "eval r_step [the ?e] \= the ?e" by simp + then show ?thesis using r_leap_total r_leap_Suc by simp +qed + +lemma r_result_Suc_saturating: + assumes "eval r_result [t, i, x] \= Suc v" + shows "eval r_result [Suc t, i, x] \= Suc v" +proof - + let ?r = "\t. eval r_ifz [pdec1 (the (eval r_leap [t, i, x])), pdec2 (the (eval r_leap [t, i, x])), 0]" + have "?r t \= Suc v" + using assms unfolding r_result_def using r_leap_total r_leap_prim by simp + then have "pdec1 (the (eval r_leap [t, i, x])) = 0" + using option.sel by fastforce + then have "eval r_leap [Suc t, i, x] = eval r_leap [t, i, x]" + using r_leap_Suc_saturating by simp + moreover have "eval r_result [t, i, x] = ?r t" + unfolding r_result_def using r_leap_total r_leap_prim by simp + moreover have "eval r_result [Suc t, i, x] = ?r (Suc t)" + unfolding r_result_def using r_leap_total r_leap_prim by simp + ultimately have "eval r_result [Suc t, i, x] = eval r_result [t, i, x]" + by simp + with assms show ?thesis by simp +qed + +lemma r_result_saturating: + assumes "eval r_result [t, i, x] \= Suc v" + shows "eval r_result [t + d, i, x] \= Suc v" + using r_result_Suc_saturating assms by (induction d) simp_all + +lemma r_result_converg': + assumes "eval r_univ [i, x] \= v" + shows "\t. (\t'\t. eval r_result [t', i, x] \= Suc v) \ (\t'= 0)" +proof - + let ?f = "Cn 3 r_not [r_result]" + let ?m = "Mn 2 ?f" + have "recfn 2 ?m" by simp + have eval_m: "eval ?m [i, x] \" + proof + assume "eval ?m [i, x] \" + then have "eval r_univ [i, x] \" + unfolding r_univ_def by simp + with assms show False by simp + qed + then obtain t where t: "eval ?m [i, x] \= t" + by auto + then have f_t: "eval ?f [t, i, x] \= 0" and f_less_t: "\y. 
y < t \ eval ?f [y, i, x] \\ 0" + using eval_Mn_convergE[of 2 ?f "[i, x]" t] `recfn 2 ?m` + by (metis (no_types, lifting) One_nat_def Suc_1 length_Cons list.size(3))+ + have eval_Cn2: "eval (Cn 2 r_result [?m, Id 2 0, Id 2 1]) [i, x] \" + proof + assume "eval (Cn 2 r_result [?m, Id 2 0, Id 2 1]) [i, x] \" + then have "eval r_univ [i, x] \" + unfolding r_univ_def by simp + with assms show False by simp + qed + have "eval r_result [t, i, x] \= Suc v" + proof (rule ccontr) + assume neq_Suc: "\ eval r_result [t, i, x] \= Suc v" + show False + proof (cases "eval r_result [t, i, x] = None") + case True + then show ?thesis using f_t by simp + next + case False + then obtain w where w: "eval r_result [t, i, x] \= w" "w \ Suc v" + using neq_Suc by auto + moreover have "eval r_result [t, i, x] \\ 0" + by (rule ccontr; use f_t in auto) + ultimately have "w \ 0" by simp + have "eval (Cn 2 r_result [?m, Id 2 0, Id 2 1]) [i, x] = + eval r_result [the (eval ?m [i, x]), i, x]" + using eval_m by simp + with w t have "eval (Cn 2 r_result [?m, Id 2 0, Id 2 1]) [i, x] \= w" + by simp + moreover have "eval r_univ [i, x] = + eval r_dec [the (eval (Cn 2 r_result [?m, Id 2 0, Id 2 1]) [i, x])]" + unfolding r_univ_def using eval_Cn2 by simp + ultimately have "eval r_univ [i, x] = eval r_dec [w]" by simp + then have "eval r_univ [i, x] \= w - 1" by simp + with assms `w \ 0` w show ?thesis by simp + qed + qed + then have "\t'\t. eval r_result [t', i, x] \= Suc v" + using r_result_saturating le_Suc_ex by blast + moreover have "eval r_result [y, i, x] \= 0" if "y < t" for y + proof (rule ccontr) + assume neq0: "eval r_result [y, i, x] \ Some 0" + then show False + proof (cases "eval r_result [y, i, x] = None") + case True + then show ?thesis using f_less_t `y < t` by fastforce + next + case False + then obtain v where "eval r_result [y, i, x] \= v" "v \ 0" + using neq0 by auto + then have "eval ?f [y, i, x] \= 0" by simp + then show ?thesis using f_less_t `y < t` by simp + qed + qed + ultimately show ?thesis by auto +qed + +lemma r_result_diverg': + assumes "eval r_univ [i, x] \" + shows "eval r_result [t, i, x] \= 0" +proof (rule ccontr) + let ?f = "Cn 3 r_not [r_result]" + let ?m = "Mn 2 ?f" + assume "eval r_result [t, i, x] \ Some 0" + with r_result_total have "eval r_result [t, i, x] \\ 0" by simp + then have "eval ?f [t, i, x] \= 0" by auto + moreover have "eval ?f [y, i, x] \" if "y < t" for y + using r_result_total by simp + ultimately have "\z. eval ?f (z # [i, x]) \= 0 \ (\y)" + by blast + then have "eval ?m [i, x] \" by simp + then have "eval r_univ [i, x] \" + unfolding r_univ_def using r_result_total by simp + with assms show False by simp +qed + +lemma r_result_bivalent': + assumes "eval r_univ [i, x] \= v" + shows "eval r_result [t, i, x] \= Suc v \ eval r_result [t, i, x] \= 0" + using r_result_converg'[OF assms] not_less by blast + +lemma r_result_Some': + assumes "eval r_result [t, i, x] \= Suc v" + shows "eval r_univ [i, x] \= v" +proof (rule ccontr) + assume not_v: "\ eval r_univ [i, x] \= v" + show False + proof (cases "eval r_univ [i, x] \") + case True + then show ?thesis + using assms r_result_diverg' by simp + next + case False + then obtain w where w: "eval r_univ [i, x] \= w" "w \ v" + using not_v by auto + then have "eval r_result [t, i, x] \= Suc w \ eval r_result [t, i, x] \= 0" + using r_result_bivalent' by simp + then show ?thesis using assms not_v w by simp + qed +qed + +lemma r_result1_converg': + assumes "eval r_phi [i, x] \= v" + shows "\t. + (\t'\t. 
eval r_result1 [t', i, x] \= Suc v) \ + (\t'= 0)" + using assms r_result1 r_result_converg' r_phi'' by simp + +lemma r_result1_diverg': + assumes "eval r_phi [i, x] \" + shows "eval r_result1 [t, i, x] \= 0" + using assms r_result1 r_result_diverg' r_phi'' by simp + +lemma r_result1_Some': + assumes "eval r_result1 [t, i, x] \= Suc v" + shows "eval r_phi [i, x] \= v" + using assms r_result1 r_result_Some' r_phi'' by simp + +text \The next function performs dovetailing in order to evaluate +$\varphi_i$ for every argument for arbitrarily many steps. Given $i$ and $z$, +the function decodes $z$ into a pair $(x, t$) and outputs zero (meaning +``true'') iff.\ the computation of $\varphi_i$ on input $x$ halts after at most +$t$ steps. Fixing $i$ and varying $z$ will eventually compute $\varphi_i$ +for every argument in the domain of $\varphi_i$ sufficiently long for it to +converge.\ + +definition "r_dovetail \ + Cn 2 r_not [Cn 2 r_result1 [Cn 2 r_pdec2 [Id 2 1], Id 2 0, Cn 2 r_pdec1 [Id 2 1]]]" + +lemma r_dovetail_prim: "prim_recfn 2 r_dovetail" + by (simp add: r_dovetail_def) + +lemma r_dovetail: + "eval r_dovetail [i, z] \= + (if the (eval r_result1 [pdec2 z, i, pdec1 z]) > 0 then 0 else 1)" + unfolding r_dovetail_def using r_result_total by simp + +text \The function $\mathit{enumdom}$ works as follows in order to +enumerate exactly the domain of $\varphi_i$. Given $i$ and $y$ it searches +for the minimum $z \geq y$ for which the dovetail function returns true. This +$z$ is decoded into $(x, t)$ and the $x$ is output. In this way every value +output by $\mathit{enumdom}$ is in the domain of $\varphi_i$ by construction +of @{term r_dovetail}. Conversely an $x$ in the domain will be output for $y += (x, t)$ where $t$ is such that $\varphi_i$ halts on $x$ within $t$ +steps.\ + +definition "r_dovedelay \ + Cn 3 r_and + [Cn 3 r_dovetail [Id 3 1, Id 3 0], + Cn 3 r_ifle [Id 3 2, Id 3 0, r_constn 2 0, r_constn 2 1]]" + +lemma r_dovedelay_prim: "prim_recfn 3 r_dovedelay" + unfolding r_dovedelay_def using r_dovetail_prim by simp + +lemma r_dovedelay: + "eval r_dovedelay [z, i, y] \= + (if the (eval r_result1 [pdec2 z, i, pdec1 z]) > 0 \ y \ z then 0 else 1)" + by (simp add: r_dovedelay_def r_dovetail r_dovetail_prim) + +definition "r_enumdom \ Cn 2 r_pdec1 [Mn 2 r_dovedelay]" + +lemma r_enumdom_recfn [simp]: "recfn 2 r_enumdom" + by (simp add: r_enumdom_def r_dovedelay_prim) + +lemma r_enumdom [simp]: + "eval r_enumdom [i, y] = + (if \z. eval r_dovedelay [z, i, y] \= 0 + then Some (pdec1 (LEAST z. eval r_dovedelay [z, i, y] \= 0)) + else None)" +proof - + let ?h = "Mn 2 r_dovedelay" + have "total r_dovedelay" + using r_dovedelay_prim by blast + then have "eval ?h [i, y] = + (if (\z. eval r_dovedelay [z, i, y] \= 0) + then Some (LEAST z. eval r_dovedelay [z, i, y] \= 0) + else None)" + using r_dovedelay_prim r_enumdom_recfn eval_Mn_convergI by simp + then show ?thesis + unfolding r_enumdom_def using r_dovedelay_prim by simp +qed + +text \If @{term i} is the code of the empty function, @{term r_enumdom} +has an empty domain, too.\ + +lemma r_enumdom_empty_domain: + assumes "\x. eval r_phi [i, x] \" + shows "\y. eval r_enumdom [i, y] \" + using assms r_result1_diverg' r_dovedelay by simp + +text \If @{term i} is the code of a function with non-empty domain, +@{term r_enumdom} enumerates its domain.\ + +lemma r_enumdom_nonempty_domain: + assumes "eval r_phi [i, x\<^sub>0] \" + shows "\y. eval r_enumdom [i, y] \" + and "\x. eval r_phi [i, x] \ \ (\y. 
eval r_enumdom [i, y] \= x)" +proof - + show "eval r_enumdom [i, y] \" for y + proof - + obtain t where t: "\t'\t. the (eval r_result1 [t', i, x\<^sub>0]) > 0" + using assms r_result1_converg' by fastforce + let ?z = "prod_encode (x\<^sub>0, max t y)" + have "y \ ?z" + using le_prod_encode_2 max.bounded_iff by blast + moreover have "pdec2 ?z \ t" by simp + ultimately have "the (eval r_result1 [pdec2 ?z, i, pdec1 ?z]) > 0" + using t by simp + with `y \ ?z` r_dovedelay have "eval r_dovedelay [?z, i, y] \= 0" + by presburger + then show "eval r_enumdom [i, y] \" + using r_enumdom by auto + qed + show "eval r_phi [i, x] \ = (\y. eval r_enumdom [i, y] \= x)" for x + proof + show "\y. eval r_enumdom [i, y] \= x" if "eval r_phi [i, x] \" for x + proof - + from that obtain v where "eval r_phi [i, x] \= v" by auto + then obtain t where t: "the (eval r_result1 [t, i, x]) > 0" + using r_result1_converg' assms + by (metis Zero_not_Suc dual_order.refl option.sel zero_less_iff_neq_zero) + let ?y = "prod_encode (x, t)" + have "eval r_dovedelay [?y, i, ?y] \= 0" + using r_dovedelay t by simp + moreover from this have "(LEAST z. eval r_dovedelay [z, i, ?y] \= 0) = ?y" + using gr_implies_not_zero r_dovedelay by (intro Least_equality; fastforce) + ultimately have "eval r_enumdom [i, ?y] \= x" + using r_enumdom by auto + then show ?thesis by blast + qed + show "eval r_phi [i, x] \" if "\y. eval r_enumdom [i, y] \= x" for x + proof - + from that obtain y where y: "eval r_enumdom [i, y] \= x" + by auto + then have "eval r_enumdom [i, y] \" + by simp + then have + "\z. eval r_dovedelay [z, i, y] \= 0" and + *: "eval r_enumdom [i, y] \= pdec1 (LEAST z. eval r_dovedelay [z, i, y] \= 0)" + (is "_ \= pdec1 ?z") + using r_enumdom by metis+ + then have z: "eval r_dovedelay [?z, i, y] \= 0" + by (meson wellorder_Least_lemma(1)) + have "the (eval r_result1 [pdec2 ?z, i, pdec1 ?z]) > 0" + proof (rule ccontr) + assume "\ (the (eval r_result1 [pdec2 ?z, i, pdec1 ?z]) > 0)" + then show False + using r_dovedelay z by simp + qed + then have "eval r_phi [i, pdec1 ?z] \" + using r_result1_diverg' assms by fastforce + then show ?thesis using y * by auto + qed + qed +qed + +text \For every $\varphi_i$ with non-empty domain there is a total +recursive function that enumerates the domain of $\varphi_i$.\ + +lemma nonempty_domain_enumerable: + assumes "eval r_phi [i, x\<^sub>0] \" + shows "\g. recfn 1 g \ total g \ (\x. eval r_phi [i, x] \ \ (\y. eval g [y] \= x))" +proof - + define g where "g \ Cn 1 r_enumdom [r_const i, Id 1 0]" + then have "recfn 1 g" by simp + moreover from this have "total g" + using totalI1[of g] g_def assms r_enumdom_nonempty_domain(1) by simp + moreover have "eval r_phi [i, x] \ \ (\y. eval g [y] \= x)" for x + unfolding g_def using r_enumdom_nonempty_domain(2)[OF assms] by simp + ultimately show ?thesis by auto +qed + + +subsection \Concurrent evaluation of functions\ + +text \We define a function that simulates two @{typ recf}s +``concurrently'' for the same argument and returns the result of the one +converging first. 
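+More precisely, the simulation yields an encoded pair whose first
+component indicates which of the two computations finished first: a
+result $(0, v)$ means the first function converged with value $v$,
+whereas $(1, v)$ means the second one did.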
If both diverge, so does the simulation function.\ + +definition "r_both \ + Cn 4 r_ifz + [Cn 4 r_result1 [Id 4 0, Id 4 1, Id 4 3], + Cn 4 r_ifz + [Cn 4 r_result1 [Id 4 0, Id 4 2, Id 4 3], + Cn 4 r_prod_encode [r_constn 3 2, r_constn 3 0], + Cn 4 r_prod_encode + [r_constn 3 1, Cn 4 r_dec [Cn 4 r_result1 [Id 4 0, Id 4 2, Id 4 3]]]], + Cn 4 r_prod_encode + [r_constn 3 0, Cn 4 r_dec [Cn 4 r_result1 [Id 4 0, Id 4 1, Id 4 3]]]]" + +lemma r_both_prim [simp]: "prim_recfn 4 r_both" + unfolding r_both_def by simp + +lemma r_both: + assumes "\x. eval r_phi [i, x] = eval f [x]" + and "\x. eval r_phi [j, x] = eval g [x]" + shows "eval f [x] \ \ eval g [x] \ \ eval r_both [t, i, j, x] \= prod_encode (2, 0)" + and "\eval r_result1 [t, i, x] \= 0; eval r_result1 [t, j, x] \= 0\ \ + eval r_both [t, i, j, x] \= prod_encode (2, 0)" + and "eval r_result1 [t, i, x] \= Suc v \ + eval r_both [t, i, j, x] \= prod_encode (0, the (eval f [x]))" + and "\eval r_result1 [t, i, x] \= 0; eval r_result1 [t, j, x] \= Suc v\ \ + eval r_both [t, i, j, x] \= prod_encode (1, the (eval g [x]))" +proof - + have r_result_total [simp]: "eval r_result [t, k, x] \" for t k x + using r_result_total by simp + { + assume "eval f [x] \ \ eval g [x] \" + then have "eval r_result1 [t, i, x] \= 0" and "eval r_result1 [t, j, x] \= 0" + using assms r_result1_diverg' by auto + then show "eval r_both [t, i, j, x] \= prod_encode (2, 0)" + unfolding r_both_def by simp + next + assume "eval r_result1 [t, i, x] \= 0" and "eval r_result1 [t, j, x] \= 0" + then show "eval r_both [t, i, j, x] \= prod_encode (2, 0)" + unfolding r_both_def by simp + next + assume "eval r_result1 [t, i, x] \= Suc v" + moreover from this have "eval r_result1 [t, i, x] \= Suc (the (eval f [x]))" + using assms r_result1_Some' by fastforce + ultimately show "eval r_both [t, i, j, x] \= prod_encode (0, the (eval f [x]))" + unfolding r_both_def by auto + next + assume "eval r_result1 [t, i, x] \= 0" and "eval r_result1 [t, j, x] \= Suc v" + moreover from this have "eval r_result1 [t, j, x] \= Suc (the (eval g [x]))" + using assms r_result1_Some' by fastforce + ultimately show "eval r_both [t, i, j, x] \= prod_encode (1, the (eval g [x]))" + unfolding r_both_def by auto + } +qed + +definition "r_parallel \ + Cn 3 r_both [Mn 3 (Cn 4 r_le [Cn 4 r_pdec1 [r_both], r_constn 3 1]), Id 3 0, Id 3 1, Id 3 2]" + +lemma r_parallel_recfn [simp]: "recfn 3 r_parallel" + unfolding r_parallel_def by simp + +lemma r_parallel: + assumes "\x. eval r_phi [i, x] = eval f [x]" + and "\x. eval r_phi [j, x] = eval g [x]" + shows "eval f [x] \ \ eval g [x] \ \ eval r_parallel [i, j, x] \" + and "eval f [x] \ \ eval g [x] \ \ + eval r_parallel [i, j, x] \= prod_encode (0, the (eval f [x]))" + and "eval g [x] \ \ eval f [x] \ \ + eval r_parallel [i, j, x] \= prod_encode (1, the (eval g [x]))" + and "eval f [x] \ \ eval g [x] \ \ + eval r_parallel [i, j, x] \= prod_encode (0, the (eval f [x])) \ + eval r_parallel [i, j, x] \= prod_encode (1, the (eval g [x]))" +proof - + let ?cond = "Cn 4 r_le [Cn 4 r_pdec1 [r_both], r_constn 3 1]" + define m where "m = Mn 3 ?cond" + then have m: "r_parallel = Cn 3 r_both [m, Id 3 0, Id 3 1, Id 3 2]" + unfolding r_parallel_def by simp + from m_def have "recfn 3 m" by simp + { + assume "eval f [x] \ \ eval g [x] \" + then have "\t. 
eval r_both [t, i, j, x] \= prod_encode (2, 0)" + using assms r_both by simp + then have "eval ?cond [t, i, j, x] \= 1" for t + by simp + then have "eval m [i, j, x] \" + unfolding m_def using eval_Mn_diverg by simp + then have "eval (Cn 3 r_both [m, Id 3 0, Id 3 1, Id 3 2]) [i, j, x] \" + using `recfn 3 m` by simp + then show "eval r_parallel [i, j, x] \" + using m by simp + next + assume "eval f [x] \ \ eval g [x] \" + then obtain vf vg where v: "eval f [x] \= vf" "eval g [x] \= vg" + by auto + then obtain tf where tf: + "\t\tf. eval r_result1 [t, i, x] \= Suc vf" + "\t= 0" + using r_result1_converg' assms by metis + from v obtain tg where tg: + "\t\tg. eval r_result1 [t, j, x] \= Suc vg" + "\t= 0" + using r_result1_converg' assms by metis + show "eval r_parallel [i, j, x] \= prod_encode (0, the (eval f [x])) \ + eval r_parallel [i, j, x] \= prod_encode (1, the (eval g [x]))" + proof (cases "tf \ tg") + case True + with tg(2) have j0: "\t= 0" + by simp + have *: "eval r_both [tf, i, j, x] \= prod_encode (0, the (eval f [x]))" + using r_both(3) assms tf(1) by simp + have "eval m [i, j, x] \= tf" + unfolding m_def + proof (rule eval_Mn_convergI) + show "recfn (length [i, j, x]) (Mn 3 ?cond)" by simp + have "eval (Cn 4 r_pdec1 [r_both]) [tf, i, j, x] \= 0" + using * by simp + then show "eval ?cond [tf, i, j, x] \= 0" by simp + have "eval r_both [t, i, j, x] \= prod_encode (2, 0)" if "t < tf" for t + using tf(2) r_both(2) assms that j0 by simp + then have "eval ?cond [t, i, j, x] \= 1" if "t < tf" for t + using that by simp + then show "\y. y < tf \ eval ?cond [y, i, j, x] \\ 0" by simp + qed + moreover have "eval r_parallel [i, j, x] = + eval (Cn 3 r_both [m, Id 3 0, Id 3 1, Id 3 2]) [i, j, x]" + using m by simp + ultimately have "eval r_parallel [i, j, x] = eval r_both [tf, i, j, x]" + using `recfn 3 m` by simp + with * have "eval r_parallel [i, j, x] \= prod_encode (0, the (eval f [x]))" + by simp + then show ?thesis by simp + next + case False + with tf(2) have i0: "\t\tg. eval r_result1 [t, i, x] \= 0" + by simp + then have *: "eval r_both [tg, i, j, x] \= prod_encode (1, the (eval g [x]))" + using assms r_both(4) tg(1) by auto + have "eval m [i, j, x] \= tg" + unfolding m_def + proof (rule eval_Mn_convergI) + show "recfn (length [i, j, x]) (Mn 3 ?cond)" by simp + have "eval (Cn 4 r_pdec1 [r_both]) [tg, i, j, x] \= 1" + using * by simp + then show "eval ?cond [tg, i, j, x] \= 0" by simp + have "eval r_both [t, i, j, x] \= prod_encode (2, 0)" if "t < tg" for t + using tg(2) r_both(2) assms that i0 by simp + then have "eval ?cond [t, i, j, x] \= 1" if "t < tg" for t + using that by simp + then show "\y. y < tg \ eval ?cond [y, i, j, x] \\ 0" by simp + qed + moreover have "eval r_parallel [i, j, x] = + eval (Cn 3 r_both [m, Id 3 0, Id 3 1, Id 3 2]) [i, j, x]" + using m by simp + ultimately have "eval r_parallel [i, j, x] = eval r_both [tg, i, j, x]" + using `recfn 3 m` by simp + with * have "eval r_parallel [i, j, x] \= prod_encode (1, the (eval g [x]))" + by simp + then show ?thesis by simp + qed + next + assume eval_fg: "eval g [x] \ \ eval f [x] \" + then have i0: "\t. eval r_result1 [t, i, x] \= 0" + using r_result1_diverg' assms by auto + from eval_fg obtain v where "eval g [x] \= v" + by auto + then obtain t\<^sub>0 where t0: + "\t\t\<^sub>0. eval r_result1 [t, j, x] \= Suc v" + "\t0. 
eval r_result1 [t, j, x] \= 0" + using r_result1_converg' assms by metis + then have *: "eval r_both [t\<^sub>0, i, j, x] \= prod_encode (1, the (eval g [x]))" + using r_both(4) assms i0 by simp + have "eval m [i, j, x] \= t\<^sub>0" + unfolding m_def + proof (rule eval_Mn_convergI) + show "recfn (length [i, j, x]) (Mn 3 ?cond)" by simp + have "eval (Cn 4 r_pdec1 [r_both]) [t\<^sub>0, i, j, x] \= 1" + using * by simp + then show "eval ?cond [t\<^sub>0, i, j, x] \= 0" by simp + have "eval r_both [t, i, j, x] \= prod_encode (2, 0)" if "t < t\<^sub>0" for t + using t0(2) r_both(2) assms that i0 by simp + then have "eval ?cond [t, i, j, x] \= 1" if "t < t\<^sub>0" for t + using that by simp + then show "\y. y < t\<^sub>0 \ eval ?cond [y, i, j, x] \\ 0" by simp + qed + moreover have "eval r_parallel [i, j, x] = + eval (Cn 3 r_both [m, Id 3 0, Id 3 1, Id 3 2]) [i, j, x]" + using m by simp + ultimately have "eval r_parallel [i, j, x] = eval r_both [t\<^sub>0, i, j, x]" + using `recfn 3 m` by simp + with * show "eval r_parallel [i, j, x] \= prod_encode (1, the (eval g [x]))" + by simp + next + assume eval_fg: "eval f [x] \ \ eval g [x] \" + then have j0: "\t. eval r_result1 [t, j, x] \= 0" + using r_result1_diverg' assms by auto + from eval_fg obtain v where "eval f [x] \= v" + by auto + then obtain t\<^sub>0 where t0: + "\t\t\<^sub>0. eval r_result1 [t, i, x] \= Suc v" + "\t0. eval r_result1 [t, i, x] \= 0" + using r_result1_converg' assms by metis + then have *: "eval r_both [t\<^sub>0, i, j, x] \= prod_encode (0, the (eval f [x]))" + using r_both(3) assms by blast + have "eval m [i, j, x] \= t\<^sub>0" + unfolding m_def + proof (rule eval_Mn_convergI) + show "recfn (length [i, j, x]) (Mn 3 ?cond)" by simp + have "eval (Cn 4 r_pdec1 [r_both]) [t\<^sub>0, i, j, x] \= 0" + using * by simp + then show "eval ?cond [t\<^sub>0, i, j, x] \= 0" + by simp + have "eval r_both [t, i, j, x] \= prod_encode (2, 0)" if "t < t\<^sub>0" for t + using t0(2) r_both(2) assms that j0 by simp + then have "eval ?cond [t, i, j, x] \= 1" if "t < t\<^sub>0" for t + using that by simp + then show "\y. y < t\<^sub>0 \ eval ?cond [y, i, j, x] \\ 0" by simp + qed + moreover have "eval r_parallel [i, j, x] = + eval (Cn 3 r_both [m, Id 3 0, Id 3 1, Id 3 2]) [i, j, x]" + using m by simp + ultimately have "eval r_parallel [i, j, x] = eval r_both [t\<^sub>0, i, j, x]" + using `recfn 3 m` by simp + with * show "eval r_parallel [i, j, x] \= prod_encode (0, the (eval f [x]))" + by simp + } +qed + +end \ No newline at end of file diff --git a/thys/Inductive_Inference/document/root.bib b/thys/Inductive_Inference/document/root.bib new file mode 100644 --- /dev/null +++ b/thys/Inductive_Inference/document/root.bib @@ -0,0 +1,181 @@ +@book{Rogers87, + Author = {Hartley {Rogers, Jr.}}, + Publisher = {The MIT Press}, + Title = {Theory of Recursive Functions and Effective Computability}, + Year = {1987}, + Edition = {2nd} +} + +@Article{Kleene43, + Author = "Stephen Cole Kleene", + Title = "Recursive predicates and quantifiers", + Journal = "Trans. Amer. Math. Soc.", + Volume = "53", + Number = "1", + Year = "1943", + Pages = "41--73", + doi = "10.1090/S0002-9947-1943-0007371-8" +} + +@misc{wiki-krt, + author = "{Wikipedia contributors}", + title = "Kleene's recursion theorem --- {Wikipedia}{,} The Free Encyclopedia", + year = "2020", + url = "https://en.wikipedia.org/w/index.php?title=Kleene%27s_recursion_theorem&oldid=936277979", + note = "[Online; accessed 28-March-2020]" +} + +@InCollection{as-ii-87, + author = "Dana Angluin and Carl H. 
Smith", + title = "Inductive Inference", + booktitle = "Encyclopedia of Artificial Intelligence", + publisher = "J. Wiley and Sons, New York", + year = "1987", + pages = "409--418", +} + +@Article{fkw-iisde-95, + author = "R\={u}si\c{n}\v{s} Freivalds and Efim B. Kinber and + Rolf Wiehagen", + title = "How Inductive Inference Strategies Discover Their + Errors", + journal = "Inform. Comput.", + volume = "118", + number = "2", + year = "1995", + pages = "208--226", +} + +@Article{cs-cicmii-83, + author = "John Case and Carl H. Smith", + title = "Comparison of Identification Criteria for Machine + Inductive Inference", + journal = "Theoret. Comput. Sci.", + volume = "25", + year = "1983", + pages = "193--220", + annote = "Was in STOC78", +} + +@InCollection{b-ttlsf-74, + author = "J. M. Barzdin", + title = "Two Theorems on the Limiting Synthesis of Functions", + booktitle = "Theory of Algorithms and Programs", + volume = "1", + publisher = "Latvian State University, Riga", + year = "1974", + pages = "82--88", + note = "In Russian", +} + +@Article{jb-cpnii-81, + author = "Klaus P. Jantke and Hans-Rainer Beick", + title = "Combining postulates of naturalness in inductive inference", + journal = "Elektronische Informationsverarbeitung und Kybernetik", + volume = "17", + number = "8/9", + year = "1981", + pages = "465--484", +} + +@Article{w-lerfss-76, + author = "Rolf Wiehagen", + title = "Limes-{E}rkennung rekursiver {F}unktionen durch spezielle {S}trategien", + journal = "Journal of Information Processing and Cybernetics (EIK)", + volume = "12", + year = "1976", + pages = "93--99", +} + +@Article{wz-idmowle-94, + author = "Rolf Wiehagen and Thomas Zeugmann", + title = "Ignoring data may be the only way to learn efficiently", + journal = "J. of Experimental and Theoret. Artif. Intell.", + volume = "6", + number = "1", + year = "1994", + pages = "131--144", +} + +@Article{g-lil-67, + author = "E. Mark Gold", + title = "Language Identification in the Limit", + journal = "Inform. Control", + volume = "10", + number = "5", + year = "1967", + pages = "447--474", + comment = "Classic paper, introducing computer science theory + into learning.", +} + +@Article{g-lr-65, + author = "E. M. Gold", + title = "Limiting Recursion", + journal = "J. Symbolic Logic", + volume = "30", + year = "1965", + pages = "28--48", +} + +@Article{s-ftiip1-64, + author = "R. J. Solomonoff", + title = "A Formal Theory of Inductive Inference: Part 1", + journal = "Inform. Control", + volume = "7", + year = "1964", + pages = "1--22", + comment = "Concerned with extrapolation of sequences. Defines + probability of extension via likelihood random TM + program will generate it.", +} + +@Article{s-ftiip2-64, + author = "R. J. Solomonoff", + title = "A Formal Theory of Inductive Inference: Part 2", + journal = "Inform. Control", + volume = "7", + year = "1964", + pages = "224--254", + comment = "Continues Part I. Inference of probabilities and + grammars.", +} + +@InProceedings{b-iiafp-74, + author = "{Ya}. M. Barzdin", + title = "Inductive Inference of Automata, Functions and Programs", + booktitle = "Proceedings International Congress of Mathematics", + year = "1974", + venue = "Vancouver", + pages = "455--460", +} + +@InProceedings{b-iiafp-77, + author = "J. M. Barzdin", + title = "Inductive Inference of Automata, Functions and Programs", + booktitle = "Amer. Math. Soc. 
Transl.", + year = "1977", + pages = "107--122", +} + +@Article{bb-tmtii-75, + author = "Leonore Blum and Manuel Blum", + title = "Toward a Mathematical Theory of Inductive Inference", + journal = "Inform. Control", + volume = "28", + number = "2", + month = jun, + year = "1975", + pages = "125--155", +} + +@article{Universal_Turing_Machine-AFP, + author = {Jian Xu and Xingyuan Zhang and Christian Urban and Sebastiaan J. C. Joosten}, + title = {Universal Turing Machine}, + journal = {Archive of Formal Proofs}, + month = feb, + year = 2019, + note = {\url{http://isa-afp.org/entries/Universal_Turing_Machine.html}, + Formal proof development}, + ISSN = {2150-914x}, +} diff --git a/thys/Inductive_Inference/document/root.tex b/thys/Inductive_Inference/document/root.tex new file mode 100644 --- /dev/null +++ b/thys/Inductive_Inference/document/root.tex @@ -0,0 +1,71 @@ +\documentclass[11pt,a4paper]{report} +\usepackage{isabelle,isabellesym} + +\usepackage[utf8]{inputenc} + +\usepackage[top=3cm,bottom=3cm]{geometry} + +\usepackage{amssymb} % for \mathbb + +% this should be the last package used +\usepackage{pdfsetup} + +% urls in roman style, theory text in math-similar italics +\urlstyle{rm} +\isabellestyle{it} + +\begin{document} + +\title{Some classical results in inductive inference of recursive functions} +\author{Frank J. Balbach} +\maketitle + +\begin{abstract} +This entry formalizes some classical concepts and results from inductive +inference of recursive functions. In the basic setting a partial recursive +function (``strategy'') must identify (``learn'') all functions from a set +(``class'') of recursive functions. To that end the strategy receives more and +more values $f(0), f(1), f(2), \ldots$ of some function $f$ from the given class +and in turn outputs descriptions of partial recursive functions, for example, +Gödel numbers. The strategy is considered successful if the sequence of outputs +(``hypotheses'') converges to a description of $f$. A class of functions +learnable in this sense is called ``learnable in the limit''. The set of all +these classes is denoted by LIM. + +Other types of inference considered are finite learning (FIN), behaviorally +correct learning in the limit (BC), and some variants of LIM with restrictions +on the hypotheses: total learning (TOTAL), consistent learning (CONS), and +class-preserving learning (CP). The main results formalized are the proper +inclusions $\mathrm{FIN} \subset \mathrm{CP} \subset \mathrm{TOTAL} \subset +\mathrm{CONS} \subset \mathrm{LIM} \subset \mathrm{BC} \subset 2^{\mathcal{R}}$, +where $\mathcal{R}$ is the set of all total recursive functions. Further +results show that for all these inference types except CONS, strategies can be +assumed to be total recursive functions; that all inference types but CP are +closed under the subset relation between classes; and that no inference type is +closed under the union of classes. + +The above is based on a formalization of recursive functions heavily inspired by +the \emph{Universal Turing Machine} entry by +Xu~et~al.~\cite{Universal_Turing_Machine-AFP}, but different in that it models +partial functions with codomain \emph{nat option}. 
The formalization contains a +construction of a universal partial recursive function, without resorting to +Turing machines, introduces decidability and recursive enumerability, and proves +some standard results: existence of a Kleene normal form, the $s$-$m$-$n$ +theorem, Rice's theorem, and assorted fixed-point theorems (recursion theorems) +by Kleene, Rogers, and Smullyan. +\end{abstract} + +\tableofcontents + +\newpage + +% sane default for proof documents +\parindent 0pt\parskip 0.5ex + +% generated text of all theories +\input{session} + +\bibliographystyle{abbrv} +\bibliography{root} + +\end{document} diff --git a/thys/ROOTS b/thys/ROOTS --- a/thys/ROOTS +++ b/thys/ROOTS @@ -1,553 +1,554 @@ ADS_Functor AODV AVL-Trees AWN Abortable_Linearizable_Modules Abs_Int_ITP2012 Abstract-Hoare-Logics Abstract-Rewriting Abstract_Completeness Abstract_Soundness Adaptive_State_Counting Affine_Arithmetic Aggregation_Algebras Akra_Bazzi Algebraic_Numbers Algebraic_VCs Allen_Calculus Amicable_Numbers Amortized_Complexity AnselmGod Applicative_Lifting Approximation_Algorithms Architectural_Design_Patterns Aristotles_Assertoric_Syllogistic Arith_Prog_Rel_Primes ArrowImpossibilityGS Attack_Trees Auto2_HOL Auto2_Imperative_HOL AutoFocus-Stream Automated_Stateful_Protocol_Verification Automatic_Refinement AxiomaticCategoryTheory BDD BNF_CC BNF_Operations Banach_Steinhaus Bell_Numbers_Spivey Berlekamp_Zassenhaus Bernoulli Bertrands_Postulate Bicategory BinarySearchTree Binding_Syntax_Theory Binomial-Heaps Binomial-Queues BirdKMP Bondy Boolean_Expression_Checkers Bounded_Deducibility_Security Buchi_Complementation Budan_Fourier Buffons_Needle Buildings BytecodeLogicJmlTypes C2KA_DistributedSystems CAVA_Automata CAVA_LTL_Modelchecker CCS CISC-Kernel CRDT CYK CakeML CakeML_Codegen Call_Arity Card_Equiv_Relations Card_Multisets Card_Number_Partitions Card_Partitions Cartan_FP Case_Labeling Catalan_Numbers Category Category2 Category3 Cauchy Cayley_Hamilton Certification_Monads Chandy_Lamport Chord_Segments Circus Clean ClockSynchInst Closest_Pair_Points CofGroups Coinductive Coinductive_Languages Collections Comparison_Sort_Lower_Bound Compiling-Exceptions-Correctly Complete_Non_Orders Completeness Complex_Geometry Complx ComponentDependencies ConcurrentGC ConcurrentIMP Concurrent_Ref_Alg Concurrent_Revisions Consensus_Refined Constructive_Cryptography Constructor_Funs Containers CoreC++ Core_DOM Count_Complex_Roots CryptHOL CryptoBasedCompositionalProperties DFS_Framework DPT-SAT-Solver DataRefinementIBP Datatype_Order_Generator Decl_Sem_Fun_PL Decreasing-Diagrams Decreasing-Diagrams-II Deep_Learning Density_Compiler Dependent_SIFUM_Refinement Dependent_SIFUM_Type_Systems Depth-First-Search Derangements Deriving Descartes_Sign_Rule Dict_Construction Differential_Dynamic_Logic Differential_Game_Logic Dijkstra_Shortest_Path Diophantine_Eqns_Lin_Hom Dirichlet_L Dirichlet_Series DiscretePricing Discrete_Summation DiskPaxos DynamicArchitectures Dynamic_Tables E_Transcendental Echelon_Form EdmondsKarp_Maxflow Efficient-Mergesort Elliptic_Curves_Group_Law Encodability_Process_Calculi Epistemic_Logic Ergodic_Theory Error_Function Euler_MacLaurin Euler_Partition Example-Submission FFT FLP FOL-Fitting FOL_Harrison FOL_Seq_Calc1 Factored_Transition_System_Bounding Falling_Factorial_Sum Farkas FeatherweightJava Featherweight_OCL Fermat3_4 FileRefinement FinFun Finger-Trees Finite_Automata_HF First_Order_Terms First_Welfare_Theorem Fishburn_Impossibility Fisher_Yates Flow_Networks Floyd_Warshall Flyspeck-Tame 
FocusStreamsCaseStudies Forcing Formal_SSA Formula_Derivatives Fourier Free-Boolean-Algebra Free-Groups FunWithFunctions FunWithTilings Functional-Automata Functional_Ordered_Resolution_Prover Furstenberg_Topology GPU_Kernel_PL Gabow_SCC Game_Based_Crypto Gauss-Jordan-Elim-Fun Gauss_Jordan Gauss_Sums Gaussian_Integers GenClock General-Triangle Generalized_Counting_Sort Generic_Deriving Generic_Join GewirthPGCProof Girth_Chromatic GoedelGod Goodstein_Lambda GraphMarkingIBP Graph_Saturation Graph_Theory Green Groebner_Bases Groebner_Macaulay Gromov_Hyperbolicity Group-Ring-Module HOL-CSP HOLCF-Prelude HRB-Slicing Heard_Of Hello_World HereditarilyFinite Hermite Hidden_Markov_Models Higher_Order_Terms Hoare_Time HotelKeyCards Huffman Hybrid_Logic Hybrid_Multi_Lane_Spatial_Logic Hybrid_Systems_VCs HyperCTL IEEE_Floating_Point IMAP-CRDT IMO2019 IMP2 IMP2_Binary_Heap IP_Addresses Imperative_Insertion_Sort Impossible_Geometry Incompleteness Incredible_Proof_Machine Inductive_Confidentiality +Inductive_Inference InfPathElimination InformationFlowSlicing InformationFlowSlicing_Inter Integration Interval_Arithmetic_Word32 Iptables_Semantics Irrational_Series_Erdos_Straus Irrationality_J_Hancl Isabelle_C Isabelle_Meta_Model Jacobson_Basic_Algebra Jinja JinjaThreads JiveDataStoreModel Jordan_Hoelder Jordan_Normal_Form KAD KAT_and_DRA KBPs KD_Tree Key_Agreement_Strong_Adversaries Kleene_Algebra Knot_Theory Knuth_Bendix_Order Knuth_Morris_Pratt Koenigsberg_Friendship Kruskal Kuratowski_Closure_Complement LLL_Basis_Reduction LLL_Factorization LOFT LTL LTL_Master_Theorem LTL_Normal_Form LTL_to_DRA LTL_to_GBA Lam-ml-Normalization LambdaAuth LambdaMu Lambda_Free_EPO Lambda_Free_KBOs Lambda_Free_RPOs Lambert_W Landau_Symbols Laplace_Transform Latin_Square LatticeProperties Launchbury Lazy-Lists-II Lazy_Case Lehmer Lifting_Definition_Option LightweightJava LinearQuantifierElim Linear_Inequalities Linear_Programming Linear_Recurrences Liouville_Numbers List-Index List-Infinite List_Interleaving List_Inversions List_Update LocalLexing Localization_Ring Locally-Nameless-Sigma Lowe_Ontological_Argument Lower_Semicontinuous Lp Lucas_Theorem MFMC_Countable MFODL_Monitor_Optimized MFOTL_Monitor MSO_Regex_Equivalence Markov_Models Marriage Mason_Stothers Matrices_for_ODEs Matrix Matrix_Tensor Matroids Max-Card-Matching Median_Of_Medians_Selection Menger Mersenne_Primes MiniML Minimal_SSA Minkowskis_Theorem Minsky_Machines Modal_Logics_for_NTS Modular_Assembly_Kit_Security Monad_Memo_DP Monad_Normalisation MonoBoolTranAlgebra MonoidalCategory Monomorphic_Monad MuchAdoAboutTwo Multi_Party_Computation Multirelations Myhill-Nerode Name_Carrying_Type_Inference Nash_Williams Nat-Interval-Logic Native_Word Nested_Multisets_Ordinals Network_Security_Policy_Verification Neumann_Morgenstern_Utility No_FTL_observers Nominal2 Noninterference_CSP Noninterference_Concurrent_Composition Noninterference_Generic_Unwinding Noninterference_Inductive_Unwinding Noninterference_Ipurge_Unwinding Noninterference_Sequential_Composition NormByEval Nullstellensatz Octonions OpSets Open_Induction Optics Optimal_BST Orbit_Stabiliser Order_Lattice_Props Ordered_Resolution_Prover Ordinal Ordinal_Partitions Ordinals_and_Cardinals Ordinary_Differential_Equations PCF PLM POPLmark-deBruijn PSemigroupsConvolution PAC_Checker Pairing_Heap Paraconsistency Parity_Game Partial_Function_MR Partial_Order_Reduction Password_Authentication_Protocol Pell Perfect-Number-Thm Perron_Frobenius Pi_Calculus Pi_Transcendental Planarity_Certificates Poincare_Bendixson 
Poincare_Disc Polynomial_Factorization Polynomial_Interpolation Polynomials Pop_Refinement Posix-Lexing Possibilistic_Noninterference Power_Sum_Polynomials Pratt_Certificate Presburger-Automata Prim_Dijkstra_Simple Prime_Distribution_Elementary Prime_Harmonic_Series Prime_Number_Theorem Priority_Queue_Braun Priority_Search_Trees Probabilistic_Noninterference Probabilistic_Prime_Tests Probabilistic_System_Zoo Probabilistic_Timed_Automata Probabilistic_While Program-Conflict-Analysis Projective_Geometry Promela Proof_Strategy_Language PropResPI Propositional_Proof_Systems Prpu_Maxflow PseudoHoops Psi_Calculi Ptolemys_Theorem QHLProver QR_Decomposition Quantales Quaternions Quick_Sort_Cost RIPEMD-160-SPARK ROBDD RSAPSS Ramsey-Infinite Random_BSTs Random_Graph_Subgraph_Threshold Randomised_BSTs Randomised_Social_Choice Rank_Nullity_Theorem Real_Impl Recursion-Addition Recursion-Theory-I Refine_Imperative_HOL Refine_Monadic RefinementReactive Regex_Equivalence Regular-Sets Regular_Algebras Relation_Algebra Relational-Incorrectness-Logic Relational_Disjoint_Set_Forests Relational_Paths Rep_Fin_Groups Residuated_Lattices Resolution_FOL Rewriting_Z Ribbon_Proofs Robbins-Conjecture Root_Balanced_Tree Routing Roy_Floyd_Warshall SATSolverVerification SDS_Impossibility SIFPL SIFUM_Type_Systems SPARCv8 Safe_Distance Safe_OCL Saturation_Framework Secondary_Sylow Security_Protocol_Refinement Selection_Heap_Sort SenSocialChoice Separata Separation_Algebra Separation_Logic_Imperative_HOL SequentInvertibility Shivers-CFA ShortestPath Show Sigma_Commit_Crypto Signature_Groebner Simpl Simple_Firewall Simplex Skew_Heap Skip_Lists Slicing Sliding_Window_Algorithm Smith_Normal_Form Smooth_Manifolds Sort_Encodings Source_Coding_Theorem Special_Function_Bounds Splay_Tree Sqrt_Babylonian Stable_Matching Statecharts Stateful_Protocol_Composition_and_Typing Stellar_Quorums Stern_Brocot Stewart_Apollonius Stirling_Formula Stochastic_Matrices Stone_Algebras Stone_Kleene_Relation_Algebras Stone_Relation_Algebras Store_Buffer_Reduction Stream-Fusion Stream_Fusion_Code Strong_Security Sturm_Sequences Sturm_Tarski Stuttering_Equivalence Subresultants Subset_Boolean_Algebras SumSquares SuperCalc Surprise_Paradox Symmetric_Polynomials Szpilrajn TESL_Language TLA Tail_Recursive_Functions Tarskis_Geometry Taylor_Models Timed_Automata Topology TortoiseHare Transcendence_Series_Hancl_Rucki Transformer_Semantics Transition_Systems_and_Automata Transitive-Closure Transitive-Closure-II Treaps Tree-Automata Tree_Decomposition Triangle Trie Twelvefold_Way Tycon Types_Tableaus_and_Goedels_God UPF UPF_Firewall UTP Universal_Turing_Machine UpDown_Scheme Valuation VectorSpace VeriComp Verified-Prover VerifyThis2018 VerifyThis2019 Vickrey_Clarke_Groves VolpanoSmith WHATandWHERE_Security WOOT_Strong_Eventual_Consistency WebAssembly Weight_Balanced_Trees Well_Quasi_Orders Winding_Number_Eval Word_Lib WorkerWrapper XML ZFC_in_HOL Zeta_3_Irrational Zeta_Function pGCL