Theory HOL-Library.Omega_Words_Fun

(*
    Author:     Stefan Merz
    Author:     Salomon Sickert
    Author:     Julian Brunner
    Author:     Peter Lammich
*)

section $\omega$-words

theory Omega_Words_Fun

imports Infinite_Set
begin

text Note: This theory is based on Stefan Merz's work.

text 
  Automata recognize languages, which are sets of words. For the
  theory of $\omega$-automata, we are mostly interested in
  $\omega$-words, but it is sometimes useful to reason about
  finite words, too. We are modeling finite words as lists; this
  lets us benefit from the existing library. Other formalizations
  could be investigated, such as representing words as functions
  whose domains are initial intervals of the natural numbers.



subsection Type declaration and elementary operations

text 
  We represent $\omega$-words as functions from the natural numbers
  to the alphabet type. Other possible formalizations include
  a coinductive definition or a uniform encoding of finite and
  infinite words, as studied by Müller et al.


type_synonym
  'a word = "nat  'a"

text 
  We can prefix a finite word to an $\omega$-word, and a way
  to obtain an $\omega$-word from a finite, non-empty word is by
  $\omega$-iteration.


definition
  conc :: "['a list, 'a word]  'a word"  (infixr  65)
  where "w  x == λn. if n < length w then w!n else x (n - length w)"

definition
  iter :: "'a list  'a word"  ((_ω) [1000])
  where "iter w == if w = [] then undefined else (λn. w!(n mod (length w)))"

lemma conc_empty[simp]: "[]  w = w"
  unfolding conc_def by auto

lemma conc_fst[simp]: "n < length w  (w  x) n = w!n"
  by (simp add: conc_def)

lemma conc_snd[simp]: "¬(n < length w)  (w  x) n = x (n - length w)"
  by (simp add: conc_def)

lemma iter_nth [simp]: "0 < length w  wω n = w!(n mod (length w))"
  by (simp add: iter_def)

lemma conc_conc[simp]: "u  v  w = (u @ v)  w" (is "?lhs = ?rhs")
proof
  fix n
  have u: "n < length u  ?lhs n = ?rhs n"
    by (simp add: conc_def nth_append)
  have v: " ¬(n < length u); n < length u + length v   ?lhs n = ?rhs n"
    by (simp add: conc_def nth_append, arith)
  have w: "¬(n < length u + length v)  ?lhs n = ?rhs n"
    by (simp add: conc_def nth_append, arith)
  from u v w show "?lhs n = ?rhs n" by blast
qed

lemma range_conc[simp]: "range (w1  w2) = set w1  range w2"
proof (intro equalityI subsetI)
  fix a
  assume "a  range (w1  w2)"
  then obtain i where 1: "a = (w1  w2) i" by auto
  then show "a  set w1  range w2"
    unfolding 1 by (cases "i < length w1") simp_all
next
  fix a
  assume a: "a  set w1  range w2"
  then show "a  range (w1  w2)"
  proof
    assume "a  set w1"
    then obtain i where 1: "i < length w1" "a = w1 ! i"
      using in_set_conv_nth by metis
    show ?thesis
    proof
      show "a = (w1  w2) i" using 1 by auto
      show "i  UNIV" by rule
    qed
  next
    assume "a  range w2"
    then obtain i where 1: "a = w2 i" by auto
    show ?thesis
    proof
      show "a = (w1  w2) (length w1 + i)" using 1 by simp
      show "length w1 + i  UNIV" by rule
    qed
  qed
qed


lemma iter_unroll: "0 < length w  wω = w  wω"
  by (simp add: fun_eq_iff mod_if)


subsection Subsequence, Prefix, and Suffix

definition suffix :: "[nat, 'a word]  'a word"
  where "suffix k x  λn. x (k+n)"

definition subsequence :: "'a word  nat  nat  'a list"  (_ [_  _] 900)
  where "subsequence w i j  map w [i..<j]"

abbreviation prefix :: "nat  'a word  'a list"
  where "prefix n w  subsequence w 0 n"

lemma suffix_nth [simp]: "(suffix k x) n = x (k+n)"
  by (simp add: suffix_def)

lemma suffix_0 [simp]: "suffix 0 x = x"
  by (simp add: suffix_def)

lemma suffix_suffix [simp]: "suffix m (suffix k x) = suffix (k+m) x"
  by (rule ext) (simp add: suffix_def add.assoc)

lemma subsequence_append: "prefix (i + j) w = prefix i w @ (w [i  i + j])"
  unfolding map_append[symmetric] upt_add_eq_append[OF le0] subsequence_def ..

lemma subsequence_drop[simp]: "drop i (w [j  k]) = w [j + i  k]"
  by (simp add: subsequence_def drop_map)

lemma subsequence_empty[simp]: "w [i  j] = []  j  i"
  by (auto simp add: subsequence_def)

lemma subsequence_length[simp]: "length (subsequence w i j) = j - i"
  by (simp add: subsequence_def)

lemma subsequence_nth[simp]: "k < j - i  (w [i  j]) ! k = w (i + k)"
  unfolding subsequence_def
  by auto

lemma subseq_to_zero[simp]: "w[i0] = []"
  by simp

lemma subseq_to_smaller[simp]: "ij  w[ij] = []"
  by simp

lemma subseq_to_Suc[simp]: "ij  w [i  Suc j] = w [ i  j ] @ [w j]"
  by (auto simp: subsequence_def)

lemma subsequence_singleton[simp]: "w [i  Suc i] = [w i]"
  by (auto simp: subsequence_def)


lemma subsequence_prefix_suffix: "prefix (j - i) (suffix i w) = w [i  j]"
proof (cases "i  j")
  case True
  have "w [i  j] = map w (map (λn. n + i) [0..<j - i])"
    unfolding map_add_upt subsequence_def
    using le_add_diff_inverse2[OF True] by force
  also
  have " = map (λn. w (n + i)) [0..<j - i]"
    unfolding map_map comp_def by blast
  finally
  show ?thesis
    unfolding subsequence_def suffix_def add.commute[of i] by simp
next
  case False
  then show ?thesis
    by (simp add: subsequence_def)
qed

lemma prefix_suffix: "x = prefix n x  (suffix n x)"
  by (rule ext) (simp add: subsequence_def conc_def)

declare prefix_suffix[symmetric, simp]


lemma word_split: obtains v1 v2 where "v = v1  v2" "length v1 = k"
proof
  show "v = prefix k v  suffix k v"
    by (rule prefix_suffix)
  show "length (prefix k v) = k"
    by simp
qed


lemma set_subsequence[simp]: "set (w[ij]) = w`{i..<j}"
  unfolding subsequence_def by auto

lemma subsequence_take[simp]: "take i (w [j  k]) = w [j  min (j + i) k]"
  by (simp add: subsequence_def take_map min_def)

lemma subsequence_shift[simp]: "(suffix i w) [j  k] = w [i + j  i + k]"
  by (metis add_diff_cancel_left subsequence_prefix_suffix suffix_suffix)

lemma suffix_subseq_join[simp]: "i  j  v [i  j]  suffix j v = suffix i v"
  by (metis (no_types, lifting) Nat.add_0_right le_add_diff_inverse prefix_suffix
    subsequence_shift suffix_suffix)

lemma prefix_conc_fst[simp]:
  assumes "j  length w"
  shows "prefix j (w  w') = take j w"
proof -
  have "i < j. (prefix j (w  w')) ! i = (take j w) ! i"
    using assms by (simp add: conc_fst subsequence_def)
  thus ?thesis
    by (simp add: assms list_eq_iff_nth_eq min.absorb2)
qed

lemma prefix_conc_snd[simp]:
  assumes "n  length u"
  shows "prefix n (u  v) = u @ prefix (n - length u) v"
proof (intro nth_equalityI)
  show "length (prefix n (u  v)) = length (u @ prefix (n - length u) v)"
    using assms by simp
  fix i
  assume "i < length (prefix n (u  v))"
  then show "prefix n (u  v) ! i = (u @ prefix (n - length u) v) ! i"
    by (cases "i < length u") (auto simp: nth_append)
qed

lemma prefix_conc_length[simp]: "prefix (length w) (w  w') = w"
  by simp

lemma suffix_conc_fst[simp]:
  assumes "n  length u"
  shows "suffix n (u  v) = drop n u  v"
proof
  show "suffix n (u  v) i = (drop n u  v) i" for i
    using assms by (cases "n + i < length u") (auto simp: algebra_simps)
qed

lemma suffix_conc_snd[simp]:
  assumes "n  length u"
  shows "suffix n (u  v) = suffix (n - length u) v"
proof
  show "suffix n (u  v) i = suffix (n - length u) v i" for i
    using assms by simp
qed

lemma suffix_conc_length[simp]: "suffix (length w) (w  w') = w'"
  unfolding conc_def by force

lemma concat_eq[iff]:
  assumes "length v1 = length v2"
  shows "v1  u1 = v2  u2  v1 = v2  u1 = u2"
  (is "?lhs  ?rhs")
proof
  assume ?lhs
  then have 1: "(v1  u1) i = (v2  u2) i" for i by auto
  show ?rhs
  proof (intro conjI ext nth_equalityI)
    show "length v1 = length v2" by (rule assms(1))
  next
    fix i
    assume 2: "i < length v1"
    have 3: "i < length v2" using assms(1) 2 by simp
    show "v1 ! i = v2 ! i" using 1[of i] 2 3 by simp
  next
    show "u1 i = u2 i" for i
      using 1[of "length v1 + i"] assms(1) by simp
  qed
next
  assume ?rhs
  then show ?lhs by simp
qed

lemma same_concat_eq[iff]: "u  v = u  w  v = w"
  by simp

lemma comp_concat[simp]: "f  u  v = map f u  (f  v)"
proof
  fix i
  show "(f  u  v) i = (map f u  (f  v)) i"
    by (cases "i < length u") simp_all
qed


subsection Prepending

primrec build :: "'a  'a word  'a word"  (infixr ## 65)
  where "(a ## w) 0 = a" | "(a ## w) (Suc i) = w i"

lemma build_eq[iff]: "a1 ## w1 = a2 ## w2  a1 = a2  w1 = w2"
proof
  assume 1: "a1 ## w1 = a2 ## w2"
  have 2: "(a1 ## w1) i = (a2 ## w2) i" for i
    using 1 by auto
  show "a1 = a2  w1 = w2"
  proof (intro conjI ext)
    show "a1 = a2"
      using 2[of "0"] by simp
    show "w1 i = w2 i" for i
      using 2[of "Suc i"] by simp
  qed
next
  assume 1: "a1 = a2  w1 = w2"
  show "a1 ## w1 = a2 ## w2" using 1 by simp
qed

lemma build_cons[simp]: "(a # u)  v = a ## u  v"
proof
  fix i
  show "((a # u)  v) i = (a ## u  v) i"
  proof (cases i)
    case 0
    show ?thesis unfolding 0 by simp
  next
    case (Suc j)
    show ?thesis unfolding Suc by (cases "j < length u", simp+)
  qed
qed

lemma build_append[simp]: "(w @ a # u)  v = w  a ## u  v"
  unfolding conc_conc[symmetric] by simp

lemma build_first[simp]: "w 0 ## suffix (Suc 0) w = w"
proof
  show "(w 0 ## suffix (Suc 0) w) i = w i" for i
    by (cases i) simp_all
qed

lemma build_split[intro]: "w = w 0 ## suffix 1 w"
  by simp

lemma build_range[simp]: "range (a ## w) = insert a (range w)"
proof safe
  show "(a ## w) i  range w  (a ## w) i = a" for i
    by (cases i) auto
  show "a  range (a ## w)"
  proof (rule range_eqI)
    show "a = (a ## w) 0" by simp
  qed
  show "w i  range (a ## w)" for i
  proof (rule range_eqI)
    show "w i = (a ## w) (Suc i)" by simp
  qed
qed

lemma suffix_singleton_suffix[simp]: "w i ## suffix (Suc i) w = suffix i w"
  using suffix_subseq_join[of i "Suc i" w]
  by simp

text Find the first occurrence of a letter from a given set
lemma word_first_split_set:
  assumes "A  range w  {}"
  obtains u a v where "w = u  [a]  v" "A  set u = {}" "a  A"
proof -
  define i where "i = (LEAST i. w i  A)"
  show ?thesis
  proof
    show "w = prefix i w  [w i]  suffix (Suc i) w"
      by simp
    show "A  set (prefix i w) = {}"
      apply safe
      subgoal premises prems for a
      proof -
        from prems obtain k where 3: "k < i" "w k = a"
          by auto
        have 4: "w k  A"
          using not_less_Least 3(1) unfolding i_def .
        show ?thesis
          using prems(1) 3(2) 4 by auto
      qed
      done
    show "w i  A"
      using LeastI assms(1) unfolding i_def by fast
  qed
qed


subsection The limit set of an $\omega$-word

text 
  The limit set (also called infinity set) of an $\omega$-word
  is the set of letters that appear infinitely often in the word.
  This set plays an important role in defining acceptance conditions
  of $\omega$-automata.


definition limit :: "'a word  'a set"
  where "limit x  {a . n . x n = a}"

lemma limit_iff_frequent: "a  limit x  (n . x n = a)"
  by (simp add: limit_def)

text 
  The following is a different way to define the limit,
  using the reverse image, making the laws about reverse
  image applicable to the limit set.
  (Might want to change the definition above?)


lemma limit_vimage: "(a  limit x) = infinite (x -` {a})"
  by (simp add: limit_def Inf_many_def vimage_def)

lemma two_in_limit_iff:
  "({a, b}  limit x) =
    ((n. x n =a )  (n. x n = a  (m>n. x m = b))  (m. x m = b  (n>m. x n = a)))"
  (is "?lhs = (?r1  ?r2  ?r3)")
proof
  assume lhs: "?lhs"
  hence 1: "?r1" by (auto simp: limit_def elim: INFM_EX)
  from lhs have "n. m>n. x m = b" by (auto simp: limit_def INFM_nat)
  hence 2: "?r2" by simp
  from lhs have "m. n>m. x n = a" by (auto simp: limit_def INFM_nat)
  hence 3: "?r3" by simp
  from 1 2 3 show "?r1  ?r2  ?r3" by simp
next
  assume "?r1  ?r2  ?r3"
  hence 1: "?r1" and 2: "?r2" and 3: "?r3" by simp+
  have infa: "m. nm. x n = a"
  proof
    fix m
    show "nm. x n = a" (is "?A m")
    proof (induct m)
      from 1 show "?A 0" by simp
    next
      fix m
      assume ih: "?A m"
      then obtain n where n: "n  m" "x n = a" by auto
      with 2 obtain k where k: "k>n" "x k = b" by auto
      with 3 obtain l where l: "l>k" "x l = a" by auto
      from n k l have "l  Suc m" by auto
      with l show "?A (Suc m)" by auto
    qed
  qed
  hence infa': "n. x n = a" by (simp add: INFM_nat_le)
  have "n. m>n. x m = b"
  proof
    fix n
    from infa obtain k where k1: "kn" and k2: "x k = a" by auto
    from 2 k2 obtain l where l1: "l>k" and l2: "x l = b" by auto
    from k1 l1 have "l > n" by auto
    with l2 show "m>n. x m = b" by auto
  qed
  hence "m. x m = b" by (simp add: INFM_nat)
  with infa' show "?lhs" by (auto simp: limit_def)
qed

text 
  For $\omega$-words over a finite alphabet, the limit set is
  non-empty. Moreover, from some position onward, any such word
  contains only letters from its limit set.


lemma limit_nonempty:
  assumes fin: "finite (range x)"
  shows "a. a  limit x"
proof -
  from fin obtain a where "a  range x  infinite (x -` {a})"
    by (rule inf_img_fin_domE) auto
  hence "a  limit x"
    by (auto simp add: limit_vimage)
  thus ?thesis ..
qed

lemmas limit_nonemptyE = limit_nonempty[THEN exE]

lemma limit_inter_INF:
  assumes hyp: "limit w  S  {}"
  shows " n. w n  S"
proof -
  from hyp obtain x where " n. w n = x" and "x  S"
    by (auto simp add: limit_def)
  thus ?thesis
    by (auto elim: INFM_mono)
qed

text 
  The reverse implication is true only if $S$ is finite.


lemma INF_limit_inter:
  assumes hyp: " n. w n   S"
    and fin: "finite (S  range w)"
  shows  "a. a  limit w  S"
proof (rule ccontr)
  assume contra: "¬(a. a  limit w  S)"
  hence "aS. finite {n. w n = a}"
    by (auto simp add: limit_def Inf_many_def)
  with fin have "finite (UN a:S  range w. {n. w n = a})"
    by auto
  moreover
  have "(UN a:S  range w. {n. w n = a}) = {n. w n  S}"
    by auto
  moreover
  note hyp
  ultimately show "False"
    by (simp add: Inf_many_def)
qed

lemma fin_ex_inf_eq_limit: "finite A  (i. w i  A)  limit w  A  {}"
  by (metis INF_limit_inter equals0D finite_Int limit_inter_INF)

lemma limit_in_range_suffix: "limit x  range (suffix k x)"
proof
  fix a
  assume "a  limit x"
  then obtain l where
    kl: "k < l" and xl: "x l = a"
    by (auto simp add: limit_def INFM_nat)
  from kl obtain m where "l = k+m"
    by (auto simp add:  less_iff_Suc_add)
  with xl show "a  range (suffix k x)"
    by auto
qed

lemma limit_in_range: "limit r  range r"
  using limit_in_range_suffix[of r 0] by simp

lemmas limit_in_range_suffixD = limit_in_range_suffix[THEN subsetD]

lemma limit_subset: "limit f  f ` {n..}"
  using limit_in_range_suffix[of f n] unfolding suffix_def by auto

theorem limit_is_suffix:
  assumes fin: "finite (range x)"
  shows "k. limit x = range (suffix k x)"
proof -
  have "k. range (suffix k x)  limit x"
  proof -
    ― ‹The set of letters that are not in the limit is certainly finite.
    from fin have "finite (range x - limit x)"
      by simp
    ― ‹Moreover, any such letter occurs only finitely often
    moreover
    have "a  range x - limit x. finite (x -` {a})"
      by (auto simp add: limit_vimage)
    ― ‹Thus, there are only finitely many occurrences of such letters.
    ultimately have "finite (UN a : range x - limit x. x -` {a})"
      by (blast intro: finite_UN_I)
    ― ‹Therefore these occurrences are within some initial interval.
    then obtain k where "(UN a : range x - limit x. x -` {a})  {..<k}"
      by (blast dest: finite_nat_bounded)
    ― ‹This is just the bound we are looking for.
    hence "m. k  m  x m  limit x"
      by (auto simp add: limit_vimage)
    hence "range (suffix k x)  limit x"
      by auto
    thus ?thesis ..
  qed
  then obtain k where "range (suffix k x)  limit x" ..
  with limit_in_range_suffix
  have "limit x = range (suffix k x)"
    by (rule subset_antisym)
  thus ?thesis ..
qed

lemmas limit_is_suffixE = limit_is_suffix[THEN exE]


text 
  The limit set enjoys some simple algebraic laws with respect
  to concatenation, suffixes, iteration, and renaming.


theorem limit_conc [simp]: "limit (w  x) = limit x"
proof (auto)
  fix a assume a: "a  limit (w  x)"
  have "m. n. m<n  x n = a"
  proof
    fix m
    from a obtain n where "m + length w < n  (w  x) n = a"
      by (auto simp add: limit_def Inf_many_def infinite_nat_iff_unbounded)
    hence "m < n - length w  x (n - length w) = a"
      by (auto simp add: conc_def)
    thus "n. m<n  x n = a" ..
  qed
  hence "infinite {n . x n = a}"
    by (simp add: infinite_nat_iff_unbounded)
  thus "a  limit x"
    by (simp add: limit_def Inf_many_def)
next
  fix a assume a: "a  limit x"
  have "m. length w < m  (n. m<n  (w  x) n = a)"
  proof (clarify)
    fix m
    assume m: "length w < m"
    with a obtain n where "m - length w < n  x n = a"
      by (auto simp add: limit_def Inf_many_def infinite_nat_iff_unbounded)
    with m have "m < n + length w  (w  x) (n + length w) = a"
      by (simp add: conc_def, arith)
    thus "n. m<n  (w  x) n = a" ..
  qed
  hence "infinite {n . (w  x) n = a}"
    by (simp add: unbounded_k_infinite)
  thus "a  limit (w  x)"
    by (simp add: limit_def Inf_many_def)
qed

theorem limit_suffix [simp]: "limit (suffix n x) = limit x"
proof -
  have "x = (prefix n x)  (suffix n x)"
    by (simp add: prefix_suffix)
  hence "limit x = limit (prefix n x  suffix n x)"
    by simp
  also have " = limit (suffix n x)"
    by (rule limit_conc)
  finally show ?thesis
    by (rule sym)
qed

theorem limit_iter [simp]:
  assumes nempty: "0 < length w"
  shows "limit wω = set w"
proof
  have "limit wω  range wω"
    by (auto simp add: limit_def dest: INFM_EX)
  also from nempty have "  set w"
    by auto
  finally show "limit wω  set w" .
next
  {
    fix a assume a: "a  set w"
    then obtain k where k: "k < length w  w!k = a"
      by (auto simp add: set_conv_nth)
    ― ‹the following bound is terrible, but it simplifies the proof
    from nempty k have "m. wω ((Suc m)*(length w) + k) = a"
      by (simp add: mod_add_left_eq [symmetric])
    moreover
    ― ‹why is the following so hard to prove??
    have "m. m < (Suc m)*(length w) + k"
    proof
      fix m
      from nempty have "1  length w" by arith
      hence "m*1  m*length w" by simp
      hence "m  m*length w" by simp
      with nempty have "m < length w + (m*length w) + k" by arith
      thus "m < (Suc m)*(length w) + k" by simp
    qed
    moreover note nempty
    ultimately have "a  limit wω"
      by (auto simp add: limit_iff_frequent INFM_nat)
  }
  then show "set w  limit wω" by auto
qed

lemma limit_o [simp]:
  assumes a: "a  limit w"
  shows "f a  limit (f  w)"
proof -
  from a
  have "n. w n = a"
    by (simp add: limit_iff_frequent)
  hence "n. f (w n) = f a"
    by (rule INFM_mono, simp)
  thus "f a  limit (f  w)"
    by (simp add: limit_iff_frequent)
qed

text 
  The converse relation is not true in general: $f(a)$ can be in the
  limit of $f \circ w$ even though $a$ is not in the limit of $w$.
  However, limit› commutes with renaming if the function is
  injective. More generally, if $f(a)$ is the image of only finitely
  many elements, some of these must be in the limit of $w$.


lemma limit_o_inv:
  assumes fin: "finite (f -` {x})"
    and x: "x  limit (f  w)"
  shows "a  (f -` {x}). a  limit w"
proof (rule ccontr)
  assume contra: "¬ ?thesis"
  ― ‹hence, every element in the pre-image occurs only finitely often
  then have "a  (f -` {x}). finite {n. w n = a}"
    by (simp add: limit_def Inf_many_def)
  ― ‹so there are only finitely many occurrences of any such element
  with fin have "finite ( a  (f -` {x}). {n. w n = a})"
    by auto
  ― ‹these are precisely those positions where $x$ occurs in $f \circ w$
  moreover
  have "( a  (f -` {x}). {n. w n = a}) = {n. f(w n) = x}"
    by auto
  ultimately
  ― ‹so $x$ can occur only finitely often in the translated word
  have "finite {n. f(w n) = x}"
    by simp
  ― ‹\ldots\ which yields a contradiction
  with x show "False"
    by (simp add: limit_def Inf_many_def)
qed

theorem limit_inj [simp]:
  assumes inj: "inj f"
  shows "limit (f  w) = f ` (limit w)"
proof
  show "f ` limit w  limit (f  w)"
    by auto
  show "limit (f  w)  f ` limit w"
  proof
    fix x
    assume x: "x  limit (f  w)"
    from inj have "finite (f -` {x})"
      by (blast intro: finite_vimageI)
    with x obtain a where a: "a  (f -` {x})  a  limit w"
      by (blast dest: limit_o_inv)
    thus "x  f ` (limit w)"
      by auto
  qed
qed

lemma limit_inter_empty:
  assumes fin: "finite (range w)"
  assumes hyp: "limit w  S = {}"
  shows "n. w n  S"
proof -
  from fin obtain k where k_def: "limit w = range (suffix k w)"
    using limit_is_suffix by blast
  have "w (k + k')  S" for k'
    using hyp unfolding k_def suffix_def image_def by blast
  thus ?thesis
    unfolding MOST_nat_le using le_Suc_ex by blast
qed

text If the limit is the suffix of the sequence's range,
  we may increase the suffix index arbitrarily
lemma limit_range_suffix_incr:
  assumes "limit r = range (suffix i r)"
  assumes "ji"
  shows "limit r = range (suffix j r)"
    (is "?lhs = ?rhs")
proof -
  have "?lhs = range (suffix i r)"
    using assms by simp
  moreover
  have "  ?rhs" using ji
    by (metis (mono_tags, lifting) assms(2)
        image_subsetI le_Suc_ex range_eqI suffix_def suffix_suffix)
  moreover
  have "  ?lhs" by (rule limit_in_range_suffix)
  ultimately
  show "?lhs = ?rhs"
    by (metis antisym_conv limit_in_range_suffix)
qed

text For two finite sequences, we can find a common suffix index such
  that the limits can be represented as these suffixes' ranges.
lemma common_range_limit:
  assumes "finite (range x)"
    and "finite (range y)"
  obtains i where "limit x = range (suffix i x)"
    and "limit y = range (suffix i y)"
proof -
  obtain i j where 1: "limit x = range (suffix i x)"
    and 2: "limit y = range (suffix j y)"
    using assms limit_is_suffix by metis
  have "limit x = range (suffix (max i j) x)"
    and "limit y = range (suffix (max i j) y)"
    using limit_range_suffix_incr[OF 1] limit_range_suffix_incr[OF 2]
    by auto
  thus ?thesis
    using that by metis
qed


subsection Index sequences and piecewise definitions

text 
  A word can be defined piecewise: given a sequence of words $w_0, w_1, \ldots$
  and a strictly increasing sequence of integers $i_0, i_1, \ldots$ where $i_0=0$,
  a single word is obtained by concatenating subwords of the $w_n$ as given by
  the integers: the resulting word is
  \[
    (w_0)_{i_0} \ldots (w_0)_{i_1-1} (w_1)_{i_1} \ldots (w_1)_{i_2-1} \ldots
  \]
  We prepare the field by proving some trivial facts about such sequences of
  indexes.


definition idx_sequence :: "nat word  bool"
  where "idx_sequence idx  (idx 0 = 0)  (n. idx n < idx (Suc n))"

lemma idx_sequence_less:
  assumes iseq: "idx_sequence idx"
  shows "idx n < idx (Suc(n+k))"
proof (induct k)
  from iseq show "idx n < idx (Suc (n + 0))"
    by (simp add: idx_sequence_def)
next
  fix k
  assume ih: "idx n < idx (Suc(n+k))"
  from iseq have "idx (Suc(n+k)) < idx (Suc(n + Suc k))"
    by (simp add: idx_sequence_def)
  with ih show "idx n < idx (Suc(n + Suc k))"
    by (rule less_trans)
qed

lemma idx_sequence_inj:
  assumes iseq: "idx_sequence idx"
    and eq: "idx m = idx n"
  shows "m = n"
proof (cases m n rule: linorder_cases)
  case greater
  then obtain k where "m = Suc(n+k)"
    by (auto simp add: less_iff_Suc_add)
  with iseq have "idx n < idx m"
    by (simp add: idx_sequence_less)
  with eq show ?thesis
    by simp
next
  case less
  then obtain k where "n = Suc(m+k)"
    by (auto simp add: less_iff_Suc_add)
  with iseq have "idx m < idx n"
    by (simp add: idx_sequence_less)
  with eq show ?thesis
    by simp
qed

lemma idx_sequence_mono:
  assumes iseq: "idx_sequence idx"
    and m: "m  n"
  shows "idx m  idx n"
proof (cases "m=n")
  case True
  thus ?thesis by simp
next
  case False
  with m have "m < n" by simp
  then obtain k where "n = Suc(m+k)"
    by (auto simp add: less_iff_Suc_add)
  with iseq have "idx m < idx n"
    by (simp add: idx_sequence_less)
  thus ?thesis by simp
qed

text 
  Given an index sequence, every natural number is contained in the
  interval defined by two adjacent indexes, and in fact this interval
  is determined uniquely.


lemma idx_sequence_idx:
  assumes "idx_sequence idx"
  shows "idx k  {idx k ..< idx (Suc k)}"
using assms by (auto simp add: idx_sequence_def)

lemma idx_sequence_interval:
  assumes iseq: "idx_sequence idx"
  shows "k. n  {idx k ..< idx (Suc k) }"
    (is "?P n" is "k. ?in n k")
proof (induct n)
  from iseq have "0 = idx 0"
    by (simp add: idx_sequence_def)
  moreover
  from iseq have "idx 0  {idx 0 ..< idx (Suc 0) }"
    by (rule idx_sequence_idx)
  ultimately
  show "?P 0" by auto
next
  fix n
  assume "?P n"
  then obtain k where k: "?in n k" ..
  show "?P (Suc n)"
  proof (cases "Suc n < idx (Suc k)")
    case True
    with k have "?in (Suc n) k"
      by simp
    thus ?thesis ..
  next
    case False
    with k have "Suc n = idx (Suc k)"
      by auto
    with iseq have "?in (Suc n) (Suc k)"
      by (simp add: idx_sequence_def)
    thus ?thesis ..
  qed
qed

lemma idx_sequence_interval_unique:
  assumes iseq: "idx_sequence idx"
    and k: "n  {idx k ..< idx (Suc k)}"
    and m: "n  {idx m ..< idx (Suc m)}"
  shows "k = m"
proof (cases k m rule: linorder_cases)
  case less
  hence "Suc k  m" by simp
  with iseq have "idx (Suc k)  idx m"
    by (rule idx_sequence_mono)
  with m have "idx (Suc k)  n"
    by auto
  with k have "False"
    by simp
  thus ?thesis ..
next
  case greater
  hence "Suc m  k" by simp
  with iseq have "idx (Suc m)  idx k"
    by (rule idx_sequence_mono)
  with k have "idx (Suc m)  n"
    by auto
  with m have "False"
    by simp
  thus ?thesis ..
qed

lemma idx_sequence_unique_interval:
  assumes iseq: "idx_sequence idx"
  shows "∃! k. n  {idx k ..< idx (Suc k) }"
proof (rule ex_ex1I)
  from iseq show "k. n  {idx k ..< idx (Suc k)}"
    by (rule idx_sequence_interval)
next
  fix k y
  assume "n  {idx k..<idx (Suc k)}" and "n  {idx y..<idx (Suc y)}"
  with iseq show "k = y" by (auto elim: idx_sequence_interval_unique)
qed

text 
  Now we can define the piecewise construction of a word using
  an index sequence.


definition merge :: "'a word word  nat word  'a word"
  where "merge ws idx  λn. let i = THE i. n  {idx i ..< idx (Suc i) } in ws i n"

lemma merge:
  assumes idx: "idx_sequence idx"
    and n: "n  {idx i ..< idx (Suc i)}"
  shows "merge ws idx n = ws i n"
proof -
  from n have "(THE k. n  {idx k ..< idx (Suc k) }) = i"
    by (rule the_equality[OF _ sym[OF idx_sequence_interval_unique[OF idx n]]]) simp
  thus ?thesis
    by (simp add: merge_def Let_def)
qed

lemma merge0:
  assumes idx: "idx_sequence idx"
  shows "merge ws idx 0 = ws 0 0"
proof (rule merge[OF idx])
  from idx have "idx 0 < idx (Suc 0)"
    unfolding idx_sequence_def by blast
  with idx show "0  {idx 0 ..< idx (Suc 0)}"
    by (simp add: idx_sequence_def)
qed

lemma merge_Suc:
  assumes idx: "idx_sequence idx"
    and n: "n  {idx i ..< idx (Suc i)}"
  shows "merge ws idx (Suc n) = (if Suc n = idx (Suc i) then ws (Suc i) else ws i) (Suc n)"
proof auto
  assume eq: "Suc n = idx (Suc i)"
  from idx have "idx (Suc i) < idx (Suc(Suc i))"
    unfolding idx_sequence_def by blast
  with eq idx show "merge ws idx (idx (Suc i)) = ws (Suc i) (idx (Suc i))"
    by (simp add: merge)
next
  assume neq: "Suc n  idx (Suc i)"
  with n have "Suc n  {idx i ..< idx (Suc i) }"
    by auto
  with idx show "merge ws idx (Suc n) = ws i (Suc n)"
    by (rule merge)
qed

end