(* Theory NN_Layers_Main *)

(***********************************************************************************
 * Copyright (c) University of Exeter, UK
 *
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are met:
 *
 * * Redistributions of source code must retain the above copyright notice, this
 *   list of conditions and the following disclaimer.
 *
 * * Redistributions in binary form must reproduce the above copyright notice,
 *   this list of conditions and the following disclaimer in the documentation
 *   and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
 * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
 * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
 * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
 * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 *
 * SPDX-License-Identifier: BSD-2-Clause
 ***********************************************************************************)

section‹Main Theory (Layers)›
theory
  NN_Layers_Main
  imports
   NN_Common 
   Activation_Functions
   NN_Digraph_Layers
   NN_Layers_List_Main
   NN_Layers_Matrix_Main

begin
text‹\label{thy:NN_Layers_Main}›

subsection‹Converting between List-based and Matrix-based Sequential Layer Models ›
(* Converts a single list-based layer into its matrix-based counterpart.
   In, Out and Activation layers are carried over field by field.
   For a Dense layer the bias list becomes a vector (vec_of_list); the weight
   list is read as matrix rows by mat_of_rows_list, with dimc taken from the
   length of the first weight row, and the resulting matrix is transposed.
   NOTE(review): dimc uses List.hd of the weight list, so an empty weight list
   is presumably only meaningful under the consistency assumptions of the
   lemmas below - confirm. *)
fun layer_list_to_matrix::‹('a list, 'b, 'a list list) layer ⇒ ('a Matrix.vec, 'b, 'a Matrix.mat) layer›
  where 
    ‹layer_list_to_matrix (In l)  = (In l)›
  | ‹layer_list_to_matrix (Out l) = (Out l)›
  | ‹layer_list_to_matrix (Activation l) = (Activation ⦇name = name l, units = units l, φ = φ l⦈)›
  | ‹layer_list_to_matrix (Dense l) = (let dimc = length (List.hd (ω l)) in 
                                     (Dense ⦇name = name l, units = units l, φ = φ l, 
                                     β = vec_of_list (β l), ω = transpose_mat (mat_of_rows_list dimc (ω l)) ⦈))›

(* Converts a single matrix-based layer into its list-based counterpart.
   In, Out and Activation layers are carried over field by field.
   For a Dense layer the bias vector becomes a list (list_of_vec) and the
   weight matrix is transposed before being turned into a list of lists
   (mat_to_list), mirroring the transpose in layer_list_to_matrix. *)
fun 
  layer_matrix_to_list::‹('a Matrix.vec, 'b, 'a Matrix.mat) layer ⇒ ('a list, 'b, 'a list list) layer›
  where 
    ‹layer_matrix_to_list (In l)  = (In l)›
  | ‹layer_matrix_to_list (Out l) = (Out l)›
  | ‹layer_matrix_to_list (Activation l) = (Activation ⦇name = name l, units = units l, φ = φ l⦈)›
  | ‹layer_matrix_to_list (Dense l) = (Dense ⦇name = name l, units = units l, φ = φ l, 
                                     β = list_of_vec (β l), ω = mat_to_list (transpose_mat  (ω l)) ⦈)›


(* Lifts an activation table on lists to one on vectors: every entry f that is
   present is wrapped as vec_of_list o f o list_of_vec; absent entries (None)
   stay absent because map_option is used. *)
definition activation_list_to_matrix:: ‹('b ⇒ (('a list ⇒ 'a list ) option)) ⇒ ('b ⇒ (('a Matrix.vec ⇒ 'a Matrix.vec ) option))›
  where 
    "activation_list_to_matrix a = map_option (λ f . vec_of_list ∘ f ∘ list_of_vec ) ∘ a"

(* Lowers an activation table on vectors to one on lists: every entry f that is
   present is wrapped as list_of_vec o f o vec_of_list; absent entries (None)
   stay absent because map_option is used. *)
definition activation_matrix_to_list:: ‹('b ⇒ (('a Matrix.vec ⇒ 'a Matrix.vec ) option)) ⇒ ('b ⇒ (('a list ⇒ 'a list ) option))›
  where 
    "activation_matrix_to_list a = map_option (λ f . list_of_vec ∘ f ∘ vec_of_list ) ∘ a"

(* Converts a whole list-based sequential network into a matrix-based one:
   each layer is converted with layer_list_to_matrix and the activation table
   with activation_list_to_matrix. *)
definition 
  nn_list_to_matrix::"('a list, 'b, 'a list list) neural_network_seq_layers ⇒ ('a Matrix.vec, 'b, 'a mat) neural_network_seq_layers"
  where
    ‹nn_list_to_matrix N = ⦇layers = map layer_list_to_matrix (layers N),
                          activation_tab = activation_list_to_matrix (activation_tab N)⦈›

(* Converts a whole matrix-based sequential network into a list-based one:
   each layer is converted with layer_matrix_to_list and the activation table
   with activation_matrix_to_list. *)
definition 
  nn_matrix_to_list::"('a Matrix.vec, 'b, 'a mat) neural_network_seq_layers ⇒ ('a list, 'b, 'a list list) neural_network_seq_layers"
  where
    ‹nn_matrix_to_list N = ⦇layers = map layer_matrix_to_list (layers N),
                          activation_tab = activation_matrix_to_list (activation_tab N)⦈›

subsection‹Converting Between List/Matrix-based Representations Preserves Consistency›

(* Round trip list -> matrix -> list is the identity on a single layer that
   satisfies the list-based layer consistency predicate.
   The proof splits on the layer constructor; In, Out and Activation are closed
   by simp, only the Dense case needs the conversion lemmas list_vec (bias)
   and mat_list (weights). *)
lemma layer_list_matrix_inverse: 
  ‹layer_consistent⇩_l N n  l ⟹ layer_matrix_to_list (layer_list_to_matrix l) = l›
proof(induction "l")
  case (In x)
  then show ?case by simp 
next
  case (Out x)
  then show ?case by simp
next
  case (Dense x)  note i = this
  then show ?case  
    apply(simp add:list_vec)
    (* rewrite the weight round trip with mat_list; its side condition is
       discharged by the metis call that follows *)
    apply(subst mat_list[of "ω x"]) 
     apply (metis empty_iff list.set(1) list.set_sel(1)) 
    by(simp)
next
  case (Activation x)
  then show ?case by simp
qed

(* Round trip matrix -> list -> matrix is the identity on a single layer that
   satisfies the matrix-based layer consistency predicate.
   Only the Dense case is non-trivial. It is split on whether every row of the
   list form of the transposed weight matrix has length dim_row of the weight
   matrix, and, if so, on whether that list form is empty. *)
lemma layer_list_list_inverse: 
  ‹layer_consistent⇩_m N n  l ⟹ layer_list_to_matrix (layer_matrix_to_list l) = l›
proof(induction "l")
  case (In x)
  then show ?case by simp
next
  case (Out x)
  then show ?case by simp
next
  case (Dense x)  note ii = this                          
  then show ?case 
  proof(cases "∀ c ∈ set (mat_to_list (ω x)⇧^T). dim_row (ω x) = (length c)")
    case True note i = this 
    then show ?thesis proof(cases "mat_to_list (ω x)⇧^T = []")
      case True
      then show ?thesis using i ii  apply(simp add:vec_list Let_def)
        by (metis dim_row_list index_transpose_mat(2) less_nat_zero_code list.size(3))
    next
      case False
      (* non-empty list form: the head row has the expected length, which is
         the dimc value that layer_list_to_matrix computes *)
      then have ‹dim_row (ω x) = length (List.hd (mat_to_list (ω x)⇧^T))› using i by simp  
      then show ?thesis  using i  
        using i list_mat_transpose_transpose list_mat index_transpose_mat Matrix.transpose_transpose
          list_mat_transpose_transpose[of "ω x", simplified]
        by(simp  add:vec_list)
    qed
  next
    case False
    (* the negated row-length condition is refuted by the dimension lemmas *)
    then show ?thesis  
      by (metis dim_col_mat_list index_transpose_mat(3))
  qed
next
  case (Activation x)
  then show ?case by simp
qed



(* Pointwise inverse law for activation tables: converting a list-based table
   to vectors and back yields the original entry at every key x.
   The proof splits on whether the table has an entry at x. *)
lemma activation_list_inverse: ‹activation_matrix_to_list (activation_list_to_matrix a) x = a x›
proof (cases "a x")
  case None
  then show ?thesis
    by (simp add: activation_list_to_matrix_def activation_matrix_to_list_def o_def)
next
  case (Some f)
  (* the stored function is wrapped twice; list_vec cancels both wrappers *)
  then show ?thesis
    by (simp add: activation_list_to_matrix_def activation_matrix_to_list_def o_def list_vec)
qed

(* Extensional form of activation_list_inverse: the round trip
   list -> matrix -> list is the identity on whole activation tables. *)
lemma activation_list_inverse': ‹activation_matrix_to_list (activation_list_to_matrix a) =a›
  by (rule ext) (rule activation_list_inverse)


(* Pointwise inverse law for activation tables: converting a matrix-based table
   to lists and back yields the original entry at every key x.
   The proof splits on whether the table has an entry at x. *)
lemma activation_matrix_inverse: ‹activation_list_to_matrix (activation_matrix_to_list a) x = a x›
proof (cases "a x")
  case None
  then show ?thesis
    by (simp add: activation_list_to_matrix_def activation_matrix_to_list_def o_def)
next
  case (Some f)
  (* the stored function is wrapped twice; vec_list cancels both wrappers *)
  then show ?thesis
    by (simp add: activation_list_to_matrix_def activation_matrix_to_list_def o_def vec_list)
qed

(* Extensional form of activation_matrix_inverse: the round trip
   matrix -> list -> matrix is the identity on whole activation tables. *)
lemma activation_matrix_inverse': ‹activation_list_to_matrix (activation_matrix_to_list a) = a›
  by (rule ext) (rule activation_matrix_inverse)

(* For a non-empty layer list, the first layer of N satisfies isIn exactly when
   the first layer of the converted network nn_list_to_matrix N does.
   Proof: destruct the record N, then split on its layer list; the Nil case
   contradicts the assumption, the Cons case is a split on the head layer. *)
lemma is_In_seq_l_eq_m:
  assumes ‹(layers N) ≠ []› 
  shows ‹isIn (List.hd (layers N)) = isIn (List.hd (layers (nn_list_to_matrix N)))›
proof(cases "N")
  case (fields layers activation_tab) note i = this
  then show ?thesis 
  proof(cases layers)
    case Nil
    then show ?thesis using assms i  by simp
  next
    case (Cons a list)
    then show ?thesis 
      using assms i 
      unfolding nn_list_to_matrix_def  
      by(cases a, simp_all)
  qed 
qed

(* For a non-empty layer list, the last layer of N satisfies isOut exactly when
   the last layer of the converted network nn_list_to_matrix N does.
   Proof: destruct the record N, then induct over its layer list. *)
lemma is_Out_seq_l_eq_m:
  assumes ‹(layers N) ≠ []› 
  shows ‹isOut (last (layers N)) = isOut (last (layers (nn_list_to_matrix N)))›
proof(cases "N")
  case (fields layers activation_tab) note i = this
  then show ?thesis
     using assms unfolding fields
   proof(induction layers)
     case Nil
     then show ?case by simp
   next
     case (Cons a layers)
     then show ?case 
    unfolding nn_list_to_matrix_def  
      by(cases a, simp_all)
    qed
  qed

(* For a non-empty layer list, all layers strictly between the first and the
   last one (tl o butlast) satisfy isInternal in N exactly when they do in the
   converted network nn_list_to_matrix N.
   Proof: destruct the record N, induct over the layer list, and in the Cons
   case induct once more over the tail. *)
lemma is_Internal_seq_l_eq_m:
  assumes ‹(layers N) ≠ []› 
  shows ‹list_all isInternal ((List.tl o butlast) (layers N)) = list_all isInternal ((List.tl o butlast) (layers (nn_list_to_matrix N)))›
proof(cases "N")
  case (fields layers activation_tab) note i = this
  then show ?thesis
     using assms unfolding fields
   proof(induction layers)
     case Nil
     then show ?case by simp
   next
     case (Cons x xs)
      
     then show ?case proof(induction xs)
       case Nil
       then show ?case  
         unfolding nn_list_to_matrix_def 
         by simp
     next
       case (Cons a xs)
       then show ?case 
         unfolding nn_list_to_matrix_def  
         by(cases a,  auto split:if_splits)
     qed
   qed
 qed 

(* Validity of the list-based activation table of N implies validity (in the
   matrix-based sense) of the activation table of nn_list_to_matrix N.
   Proved by unfolding both validity predicates and the conversion, then smt. *)
lemma valid_activation_tab_seq_l_imp_m:
  ‹valid_activation_tab⇩_l (activation_tab N) ⟹  valid_activation_tab⇩_m (activation_tab (nn_list_to_matrix N))›
  unfolding valid_activation_tab⇩_l_def valid_activation_tab⇩_m_def nn_list_to_matrix_def activation_list_to_matrix_def o_def
  by (simp, smt (verit, del_insts) length_list_of_vec list_vec map_option_eq_Some mem_Collect_eq ran_def) 

(* List-based layer consistency of N (for input width n) carries over to
   matrix-based layer consistency of the converted network nn_list_to_matrix N.
   Proof: destruct the record N and induct over its layer list, generalising
   the input width n and the activation table. The Cons case splits on the
   constructor of the head layer; in every branch the tail is handled via the
   lemmas stating that consistency does not depend on the layers field
   (layers_consistent..._activation_tab_const). *)
lemma layers_consistent_seq_l_imp_m:
  assumes ‹layers_consistent⇩_l N n  (layers N)› 
  shows ‹layers_consistent⇩_m (nn_list_to_matrix N) n  (layers (nn_list_to_matrix N)) ›
proof(cases "N")
  case (fields layers activation_tab) note i = this
  then show ?thesis 
    unfolding fields 
  proof(insert assms[simplified fields, simplified], induction "layers" arbitrary:n activation_tab)
    case Nil
    then show ?case   
      unfolding nn_list_to_matrix_def valid_activation_tab⇩_l_def valid_activation_tab⇩_m_def activation_list_to_matrix_def o_def
      by simp   next
    case (Cons a layers)
    then show ?case proof(cases "a") 
      case (In x1) note iii = this
      then show ?thesis   using Cons 
        unfolding In nn_list_to_matrix_def valid_activation_tab⇩_l_def valid_activation_tab⇩_m_def activation_list_to_matrix_def o_def
        apply(simp add: Cons iii nn_list_to_matrix_def activation_list_to_matrix_def o_def)
        using  iii Cons layers_consistent⇩_l_activation_tab_const 
          layers_consistent⇩_m_activation_tab_const neural_network_seq_layers.select_convs(2)
        by metis 
    next
      case (Out x2)
      then show ?thesis using Cons 
        unfolding nn_list_to_matrix_def valid_activation_tab⇩_l_def valid_activation_tab⇩_m_def activation_list_to_matrix_def o_def
        by (simp, metis (mono_tags, lifting) layers_consistent⇩_l_activation_tab_const 
            layers_consistent⇩_m_activation_tab_const neural_network_seq_layers.select_convs(2))
    next
      case (Dense x3) note iii = this
      then show ?thesis 
      proof(cases x3) 
        case (fields name units φ β ω) 
        then show ?thesis using Cons 
          apply(simp add: nn_list_to_matrix_def, safe) 
          (* first subgoal: the activation entry of the head Dense layer *)
          subgoal 
            unfolding nn_list_to_matrix_def
            apply(simp add: i Cons iii dim_col_list dim_col_mat_of_row_list dim_row_mat_of_row_list 
                nn_list_to_matrix_def)
            by (smt (verit, ccfv_SIG) activation_list_to_matrix_def list.set_sel(1) list.size(3) not_less_iff_gr_or_eq o_def option.map(2)) 
          (* second subgoal: consistency of the remaining layers *)
          subgoal    
            unfolding nn_list_to_matrix_def
            apply(simp add: i Cons iii dim_col_list dim_col_mat_of_row_list dim_row_mat_of_row_list 
                nn_list_to_matrix_def) 
            by (metis  layers_consistent⇩_l_activation_tab_const layers_consistent⇩_m_activation_tab_const 
                neural_network_seq_layers.select_convs(2)) 
          done 
      qed
    next
      case (Activation x4) note iii = this
      then show ?thesis using Cons 
        apply(simp add: nn_list_to_matrix_def) 
        unfolding nn_list_to_matrix_def
        apply(simp add: i  iii dim_col_list dim_col_mat_of_row_list dim_row_mat_of_row_list 
            nn_list_to_matrix_def) 
        by (metis (mono_tags, lifting) activation_list_to_matrix_def layers_consistent⇩_l_activation_tab_const 
            layers_consistent⇩_m_activation_tab_const neural_network_seq_layers.select_convs(2) o_def option.map(2)) 
    qed
  qed
qed

(* in_deg_NN is unchanged by the list-to-matrix conversion.
   Proof: split on the layer list of N; the Cons case splits on the head layer. *)
lemma  in_deg_seq_l_eq_m: ‹in_deg_NN N = (in_deg_NN (nn_list_to_matrix N))›
proof(cases "layers N")
  case Nil
  then show ?thesis 
    unfolding in_deg_NN_def nn_list_to_matrix_def by simp
next
  case (Cons a list)
  then show ?thesis 
    unfolding in_deg_NN_def nn_list_to_matrix_def o_def 
    by(cases a, auto split:if_splits)
qed

(* For a non-empty layer list, the first layer of N satisfies isIn exactly when
   the first layer of the converted network nn_matrix_to_list N does.
   Proof: destruct the record N, then split on its layer list. *)
lemma is_In_seq_m_eq_l:
  assumes ‹(layers N) ≠ []› 
  shows ‹isIn (List.hd (layers N)) = isIn (List.hd (layers (nn_matrix_to_list N)))›
proof(cases "N")
  case (fields layers activation_tab)
  then show ?thesis  
  proof(insert assms, cases layers)
    case Nil
    then show ?thesis using assms unfolding fields by simp  
  next
    case (Cons a list)
    then show ?thesis 
      using assms fields
      unfolding nn_matrix_to_list_def  
      by(cases a, simp_all)
  qed 
qed

(* For a non-empty layer list, the last layer of N satisfies isOut exactly when
   the last layer of the converted network nn_matrix_to_list N does.
   Proof: destruct the record N, then induct over its layer list. *)
lemma is_Out_seq_m_eq_l:
  assumes ‹(layers N) ≠ []› 
  shows ‹isOut (last (layers N)) = isOut (last (layers (nn_matrix_to_list N)))›
proof(cases "N")
  case (fields layers activation_tab) note i = this
  then show ?thesis unfolding fields 
  proof(insert assms[simplified fields], induction layers)
    case Nil
    then show ?case by simp 
  next
    case (Cons a layers)
    then show ?case 
      unfolding nn_matrix_to_list_def  
      by(cases a, simp_all)    
  qed
qed

(* For a non-empty layer list, all layers strictly between the first and the
   last one (tl o butlast) satisfy isInternal in N exactly when they do in the
   converted network nn_matrix_to_list N.
   Proof: destruct the record N, induct over the layer list, and in the Cons
   case induct once more over the tail. *)
lemma is_Internal_seq_m_eq_l:
  assumes ‹(layers N) ≠ []› 
  shows ‹list_all isInternal ((List.tl o butlast) (layers N)) = list_all isInternal ((List.tl o butlast) (layers (nn_matrix_to_list N)))›
proof(cases "N")
  case (fields layers activation_tab) note i = this
  then show ?thesis unfolding fields
  proof(insert assms[simplified fields], induction layers)
    case Nil
    (* NOTE(review): no Cons case has been opened at this point, so the name
       Cons below presumably resolves to some unrelated fact from the
       background theory; the sibling lemma is_Internal_seq_l_eq_m closes this
       case with plain simp - confirm and consider dropping "using Cons". *)
    then show ?case using Cons unfolding nn_matrix_to_list_def by simp 
  next
    case (Cons x xs)
    then show ?case
    proof(induction xs)
      case Nil
      then show ?case using Cons unfolding nn_matrix_to_list_def by simp 
    next
      case (Cons a xs)
      then show ?case using Cons unfolding nn_matrix_to_list_def by (cases a, auto split:if_splits) 
    qed
  qed
qed

(* Validity of the matrix-based activation table of N implies validity (in the
   list-based sense) of the activation table of nn_matrix_to_list N.
   Proved by unfolding both validity predicates and the conversion, then smt. *)
lemma valid_activation_tab_seq_m_imp_l:
  ‹valid_activation_tab⇩_m (activation_tab N) ⟹  valid_activation_tab⇩_l (activation_tab (nn_matrix_to_list N))›
  unfolding valid_activation_tab⇩_l_def valid_activation_tab⇩_m_def nn_matrix_to_list_def activation_matrix_to_list_def o_def
  by (simp, smt (verit, del_insts) length_list_of_vec list_vec map_option_eq_Some mem_Collect_eq ran_def) 

(* Matrix-based layer consistency of N (for input width n) carries over to
   list-based layer consistency of the converted network nn_matrix_to_list N.
   Proof: destruct the record N and induct over its layer list, generalising
   the input width n and the activation table. The Cons case splits on the
   constructor of the head layer; in every branch the tail is handled via the
   lemmas stating that consistency does not depend on the layers field
   (layers_consistent..._activation_tab_const). *)
lemma layers_consistent_seq_m_imp_l:
  assumes ‹layers_consistent⇩_m N n  (layers N)›
  shows ‹  layers_consistent⇩_l (nn_matrix_to_list N) n  (layers (nn_matrix_to_list N)) ›
proof(cases "N")
  case (fields layers activation_tab) note i = this
  then show ?thesis 
    unfolding fields nn_matrix_to_list_def activation_matrix_to_list_def
  proof(insert assms[simplified fields], induction "layers" arbitrary:n activation_tab)
    case Nil
    then show ?case   
      unfolding nn_matrix_to_list_def valid_activation_tab⇩_l_def valid_activation_tab⇩_m_def activation_matrix_to_list_def o_def
      by simp   next
    case (Cons a layers) note ii = this
    then show ?case proof(cases "a") 
      case (In x1) note iii = this
      then show ?thesis using Cons   
        unfolding nn_matrix_to_list_def valid_activation_tab⇩_l_def valid_activation_tab⇩_m_def activation_matrix_to_list_def o_def
        by (simp, metis (mono_tags, lifting) layers_consistent⇩_l_activation_tab_const
            layers_consistent⇩_m_activation_tab_const neural_network_seq_layers.select_convs(2))
    next
      case (Out x2)
      then show ?thesis using Cons
        unfolding nn_matrix_to_list_def valid_activation_tab⇩_l_def valid_activation_tab⇩_m_def activation_matrix_to_list_def o_def
        by (simp, metis (mono_tags, lifting) layers_consistent⇩_l_activation_tab_const 
            layers_consistent⇩_m_activation_tab_const neural_network_seq_layers.select_convs(2))
    next
      case (Dense x3) note iii = this
      then show ?thesis 
      proof(cases x3) 
        case (fields name units φ β ω) 
        then show ?thesis using Cons
          apply(simp add: nn_matrix_to_list_def, safe) 
          (* first subgoal: closed with the row-count lemma for the transposed
             weight matrix *)
          subgoal 
            unfolding nn_matrix_to_list_def
            apply(simp add: i ii iii dim_col_list dim_col_mat_of_row_list dim_row_mat_of_row_list 
                nn_matrix_to_list_def) 
            by (metis dim_row_list index_transpose_mat(2))
          (* second subgoal: consistency of the remaining layers *)
          subgoal    
            unfolding nn_matrix_to_list_def
            apply(simp add: i ii iii dim_col_list dim_col_mat_of_row_list dim_row_mat_of_row_list 
                nn_matrix_to_list_def) 
            by (metis layers_consistent⇩_l_activation_tab_const layers_consistent⇩_m_activation_tab_const 
                neural_network_seq_layers.select_convs(2)) 
          done 
      qed
    next
      case (Activation x4) note iii = this
      then show ?thesis  using Cons
        apply(simp add: nn_matrix_to_list_def) 
        unfolding nn_matrix_to_list_def
        apply(simp add: i ii iii dim_col_list dim_col_mat_of_row_list dim_row_mat_of_row_list 
            nn_matrix_to_list_def) 
        by (metis layers_consistent⇩_l_activation_tab_const layers_consistent⇩_m_activation_tab_const 
            neural_network_seq_layers.select_convs(2))
    qed
  qed
qed

(* in_deg_NN is unchanged by the matrix-to-list conversion.
   Proof: split on the layer list of N; the Cons case splits on the head layer. *)
lemma  in_deg_seq_m_eq_l: ‹in_deg_NN N = (in_deg_NN (nn_matrix_to_list N))›
proof(cases "layers N")
  case Nil
  then show ?thesis 
    unfolding in_deg_NN_def nn_matrix_to_list_def by simp
next
  case (Cons a list)
  then show ?thesis 
    unfolding in_deg_NN_def nn_matrix_to_list_def o_def 
    by(cases a, auto split:if_splits)
qed

(* Main preservation result, list to matrix: if N satisfies the list-based
   sequential-layers predicate, then nn_list_to_matrix N satisfies the
   matrix-based one. After unfolding both predicates, the five resulting
   subgoals are closed with the preservation lemmas for isIn, isOut,
   isInternal, the activation table, and layer consistency / in_deg_NN. *)
theorem neural_network_sequential_l_m: 
  ‹neural_network_sequential_layers⇩_l N ⟹ neural_network_sequential_layers⇩_m (nn_list_to_matrix N)›
  unfolding neural_network_sequential_layers⇩_l_def neural_network_sequential_layers⇩_m_def
  apply(safe)[1]
  subgoal by (metis hd_Nil_eq_last isIn.elims(2) isOut.simps(2) is_In_seq_l_eq_m) 
  subgoal by (metis hd_Nil_eq_last isIn.elims(2) isOut.simps(2) is_Out_seq_l_eq_m) 
  subgoal by (metis hd_Nil_eq_last isIn.elims(2) isOut.simps(2) is_Internal_seq_l_eq_m) 
  subgoal using valid_activation_tab_seq_l_imp_m by blast
  subgoal using layers_consistent_seq_l_imp_m in_deg_seq_l_eq_m by metis
  done 

(* Main preservation result, matrix to list: if N satisfies the matrix-based
   sequential-layers predicate, then nn_matrix_to_list N satisfies the
   list-based one. After unfolding both predicates, the five resulting
   subgoals are closed with the preservation lemmas for isIn, isOut,
   isInternal, the activation table, and layer consistency / in_deg_NN. *)
theorem neural_network_sequential_m_l: 
  ‹neural_network_sequential_layers⇩_m N ⟹ neural_network_sequential_layers⇩_l (nn_matrix_to_list N)›
  unfolding neural_network_sequential_layers⇩_l_def neural_network_sequential_layers⇩_m_def
  apply(safe)[1]
  subgoal by (metis hd_Nil_eq_last isIn.elims(2) isOut.simps(2) is_In_seq_m_eq_l)
  subgoal by (metis hd_Nil_eq_last isIn.elims(2) isOut.simps(2) is_Out_seq_m_eq_l) 
  subgoal by (metis hd_Nil_eq_last isIn.elims(2) isOut.simps(2) is_Internal_seq_m_eq_l) 
  subgoal using valid_activation_tab_seq_m_imp_l by blast
  subgoal using layers_consistent_seq_m_imp_l in_deg_seq_m_eq_l by metis
  done 

(* Network-level round trip list -> matrix -> list is the identity, provided
   the layers of N are consistent in the list-based sense.
   The activation table is handled by activation_list_inverse', the layer list
   by layer_list_matrix_inverse applied to every layer. *)
lemma matrix_list_inverse:
  assumes ‹layers_consistent⇩_l N n (layers N)› 
  shows ‹nn_matrix_to_list (nn_list_to_matrix N) = N›
proof(cases "N") 
  case (fields layers activation_tab) note i = this
  then show ?thesis 
    unfolding nn_matrix_to_list_def nn_list_to_matrix_def 
    apply(simp add: o_def activation_list_inverse')
    using assms layers_consistent⇩_lAll layer_list_matrix_inverse
    by (metis (no_types, lifting) list.map_ident_strong neural_network_seq_layers.select_convs(1)) 
qed  


(* Network-level round trip matrix -> list -> matrix is the identity, provided
   the layers of N are consistent in the matrix-based sense.
   The activation table is handled by activation_matrix_inverse', the layer
   list by layer_list_list_inverse applied to every layer. *)
lemma list_matrix_inverse:
  assumes ‹layers_consistent⇩_m N n (layers N)› 
  shows ‹nn_list_to_matrix (nn_matrix_to_list N) = N›
proof(cases "N") 
  case (fields layers activation_tab) note i = this
  then show ?thesis 
    unfolding nn_matrix_to_list_def nn_list_to_matrix_def 
    apply(simp add: o_def activation_matrix_inverse')
    using assms layers_consistent⇩_mAll 
    by (metis (no_types, lifting) layer_list_list_inverse list.map_ident_strong neural_network_seq_layers.select_convs(1)) 
qed  

(* If every row of ws has length "length ws", rebuilding ws entry by entry
   through double indexing over [0..<length ws] gives back ws. *)
lemma square_nth_nth_id:‹
    ∀ w ∈ set ws. length w = length ws ⟹
    (map (λi. (map (λia. ws ! i ! ia ) [0..<length ws])) [0..<length ws]) = ws
› 
  by (smt (verit, del_insts) in_set_conv_nth length_map map_cong map_nth nth_map) 

(* Mapping f over the elements reached by indexing xs at 0..<length xs is the
   same as mapping f over xs directly. *)
lemma nth_map_f: ‹map ((λ i. f(xs ! i))) [0..<length xs] = map f xs›
  by (smt (verit) add_0 diff_zero length_map map_upt_eqI nth_map) 


(* Variant of square_nth_nth_id with a function applied to every entry: if
   every row of ws has length "length ws", the doubly indexed map of f equals
   map (map f) ws. *)
lemma square_nth_nth_id_f:‹
    ∀ w ∈ set ws. length w = length ws ⟹
    (map (λi. (map (λia. f (ws ! i ! ia) ) [0..<length ws])) [0..<length ws]) = map (map f) ws› 
  using add_0 diff_zero length_map map_upt_eqI nth_map map_eq_conv map_nth nth_map_f[of "map f" ws] square_nth_nth_id[of ws]
  by(smt)

(* For equally long lists over a commutative ring, the index-wise products
   ws ! ia * Inputs ! ia equal the zipped products of Inputs and ws. The
   operands appear in swapped order on the right-hand side, which is why
   mult.commute is supplied to simp. *)
lemma F:‹ length (ws::'a::{comm_ring} list) = length Inputs ⟹ map (λia. ws ! ia * Inputs ! ia) [0..<length Inputs] = map2 (*) Inputs ws›
  by (simp add: map_equality_iff mult.commute) 

(* A list of length one consists of exactly one element. *)
lemma list_singleton: ‹length xs = 1 ⟹ ∃ e. xs = [e] ›
  by (cases xs) auto


(* For an Activation layer, the list-based layer prediction on vs agrees with
   the matrix-based layer prediction of the converted network on
   vec_of_list vs, once the matrix result is mapped back with list_of_vec. *)
lemma activation_list_to_matrix_eq:
  ‹predict⇩_l⇩_a⇩_y⇩_e⇩_r⇩_{_}⇩_l N (Some (vs::'a::comm_ring list)) (Activation pl) = 
    map_option list_of_vec (predict⇩_l⇩_a⇩_y⇩_e⇩_r_⇩_m (nn_list_to_matrix N) (Some (vec_of_list vs)) ((layer_list_to_matrix (Activation pl)))) ›
  unfolding nn_list_to_matrix_def activation_list_to_matrix_def  
  by(auto simp add: vec_list list_vec split:option.split)

(* The layer list of nn_matrix_to_list N is the layer-wise conversion of the
   layer list of N. *)
lemma layers_matrix_to_list: 
  ‹(layers (nn_matrix_to_list N)) = map layer_matrix_to_list (layers N)›
  by (simp add: nn_matrix_to_list_def)

(* The layer list of nn_list_to_matrix N is the layer-wise conversion of the
   layer list of N. *)
lemma layers_list_to_matrix: 
  ‹(layers (nn_list_to_matrix N)) = map layer_list_to_matrix (layers N)›
  by (simp add: nn_list_to_matrix_def)

(* Cons form of layers_list_to_matrix: when the layer list of N is l#ls, the
   converted network starts with the converted head followed by the converted
   tail. *)
lemma layers_list_to_matrix': 
  ‹layers N = l#ls ⟹ (layers (nn_list_to_matrix N)) = (layer_list_to_matrix l)#(map layer_list_to_matrix ls)›
  by (simp add: nn_list_to_matrix_def)

(* Same statement as layers_list_to_matrix', phrased for an explicit record
   whose layers field is l # ls. *)
lemma layers_list_to_matrix'':
  ‹(layers (nn_list_to_matrix ⦇layers = l # ls, activation_tab = a⦈)) = ((layer_list_to_matrix l)#(map layer_list_to_matrix ls))›
  by (simp add: nn_list_to_matrix_def)

(* A key without an entry in the activation table of N also has no entry in the
   activation table of the converted network. *)
lemma layers_list_to_matrix_none: 
  ‹activation_tab N p = None ⟹ (activation_tab (nn_list_to_matrix N)) p  = None›
  by (simp add: nn_list_to_matrix_def activation_list_to_matrix_def o_def)

(* A key mapped to f in the activation table of N is mapped, in the converted
   network, to f wrapped between list_of_vec (on the argument) and vec_of_list
   (on the result). *)
lemma layers_list_to_matrix_some: 
  ‹activation_tab N p = Some f ⟹ (activation_tab (nn_list_to_matrix N)) p  = Some (λx. vec_of_list (f (list_of_vec x))) ›
  by (simp add: nn_list_to_matrix_def activation_list_to_matrix_def o_def)

(* The activation table of nn_list_to_matrix N is the converted activation
   table of N. *)
lemma activation_list_to_matrix: 
  ‹(activation_tab (nn_list_to_matrix N))  = (activation_list_to_matrix (activation_tab N)) ›
  by (simp add: nn_list_to_matrix_def)

(* Adding vec_of_list bs to a vector M of the same dimension equals the vector
   built from the element-wise sum of list_of_vec M and bs.
   NOTE(review): the smt call cites vec_add_list', which is only stated after
   this lemma in this file; it presumably resolves to a lemma of the same name
   from an imported theory (a qualified Matrix_Utils.vec_add_list is referenced
   further down) - confirm. *)
lemma vec_add_list: 
  assumes ‹dim_vec M = length bs›
  shows ‹M + vec_of_list bs = vec_of_list (map2 (+) (list_of_vec M) bs)›
  using assms unfolding plus_vec_def
  apply(simp) 
  by (smt (verit, del_insts) dim_vec dim_vec_of_list eq_vecI index_add_vec(1) index_add_vec(2) index_vec vec_add_list' vec_list vec_of_list_map)

(* Adding two vectors of equal dimension equals the vector built from the
   element-wise sum of their list forms.
   NOTE(review): the smt call cites a fact named vec_add_list', i.e. the name
   of this very lemma; it presumably resolves to an earlier lemma of the same
   name from an imported theory - confirm. *)
lemma vec_add_list': 
  assumes ‹dim_vec M = dim_vec bs›
  shows ‹M + bs = vec_of_list (map2 (+) (list_of_vec M) (list_of_vec bs))›
  using assms unfolding plus_vec_def
  apply(simp) 
  by (smt (verit, del_insts) dim_vec dim_vec_of_list eq_vecI index_add_vec(1) index_add_vec(2) index_vec vec_add_list' vec_list vec_of_list_map)


(* Every vector equals vec_of_list applied to the list of its entries at
   indices 0..<dim_vec v. *)
lemma list_of_vec_map':
  ‹v = vec_of_list (map ((vec_index) v) [0..<dim_vec v])›
  by (metis list_of_vec_map vec_list) 

(* For a matrix with at least one row and one column, the list form of the
   transposed matrix equals List.transpose of the list form of the matrix.
   The proof unfolds the matrix representation down to mk_mat and finishes
   with transpose_rectangle. *)
lemma mat_list_transpose: 
  assumes ‹0 < dim_row M› and ‹0 < dim_col M›  
  shows ‹(mat_to_list M⇧^T) = List.transpose (mat_to_list M)›
  using assms 
  unfolding transpose_mat_def mat_to_list_def 
  apply(simp)
  unfolding index_mat_def o_def map_fun_def id_def mat_def mk_mat_def
  apply(subst Abs_mat_inverse)
  unfolding mk_mat_def apply(blast)
  by(subst transpose_rectangle, auto)

(* A matrix with a non-zero number of rows has a non-empty list form. *)
lemma dim_row_mat_not_zero:
  assumes ‹dim_row M ≠ 0› 
  shows ‹mat_to_list M ≠ []›
  by (metis assms dim_row_list list.size(3)) 

(* For equally long lists, the zipped element-wise product equals the list of
   index-wise products over 0..<length xs. *)
lemma map2_to_map_idx_eq: ‹length xs = length ys ⟹ (map2 (*) xs (ys)) = map (λ i. xs!i * ys!i) [0..< length xs]›
  by (metis map2_map_map map_nth)

(* Without a length assumption: the zipped element-wise product equals the list
   of index-wise products over indices below the shorter of the two lengths. *)
lemma map2_to_map_idx: ‹(map2 (*) xs (ys)) = map (λ i. xs!i * ys!i) [0..< min (length xs) (length ys)]›
  by (rule nth_equalityI) auto

(* For a matrix with at least one row and one column, List.transpose of its
   list form has dim_col M entries. Obtained by rewriting backwards with
   mat_list_transpose and dim_row_list. *)
lemma length_list_transpose_mat: ‹0 < dim_row M ⟹ 0 < dim_col M  ⟹ length (List.transpose (mat_to_list M)) = dim_col M›
  apply(simp only: mat_list_transpose[symmetric] dim_row_list[symmetric])
  by simp

(* Rewrites a map over the rows of List.transpose (mat_to_list M) into a map
   over the row indices; each entry is the sum of the element-wise products of
   the row with list_of_vec v. *)
lemma map_sum_list_idx: ‹
   map (λm. sum_list (map2 (*) m (list_of_vec v))) (List.transpose (mat_to_list M))
 = map (λi. sum_list (map2 (*) ((List.transpose (mat_to_list M))!i) (list_of_vec v))) [0..<length (List.transpose (mat_to_list M))]›
  by (smt (verit, best) map_cong nth_map_f) 

(* List characterisation of the vector-matrix product: for a non-degenerate
   matrix M whose list rows all have length dim_col M and a vector v with
   dim_vec v = dim_row M, the product of v with M equals the vector whose
   entries are, for each row m of the list form of the transposed matrix, the
   sum of the element-wise products of m with list_of_vec v.
   The apply script is order dependent: it first moves both sides into list
   form, then turns the finite sum of the scalar product into sum_list, and
   finally compares both lists index by index (nth_equalityI). *)
lemma  vec_mult_mat_list: 
  assumes ‹∀as∈set (mat_to_list M). length as = dim_col M›
    and ‹dim_vec v = dim_row M›
    and ‹dim_col M ≠ 0› 
    and ‹dim_row M ≠ 0› 
  shows ‹  (v::'a::comm_ring vec)  ⇩_v* M = vec_of_list (map (λm. sum_list (map2 (*) m (list_of_vec v))) (mat_to_list M⇧^T))›
  apply(insert dim_row_mat_not_zero[of M])
  apply(rule list_of_vec_ext)
  apply(subst vec_list[of v, symmetric])
  apply(subst list_mat[of M, symmetric])
  unfolding mult_vec_mat_def scalar_prod_def
  apply(simp only:vec_of_list_index)
  apply(simp only:vec_list)
  apply(subst col_of_rows_list')
  using assms apply(simp)
  using assms apply(simp)

  (* replace the set-based sum over the index range by sum_list *)
  unfolding sum_def
  apply(subst comm_monoid_list_set.distinct_set_conv_list[of "(+)" "0" "[0..<dim_vec v]", simplified])
  using sum.comm_monoid_list_set_axioms apply blast
  apply(simp only:sum_list_def[symmetric])
  apply(simp only: list_vec)
  apply(simp only:vec_of_list_index)
  apply(simp add:dim_col_mat_of_row_list)
  using  assms dim_row_list  length_0_conv  
  apply(simp only: map_sum_list_idx)
  apply(subst  map2_to_map_idx)

  (* compare both lists position by position *)
  apply (rule nth_equalityI)
   apply (simp add: mat_to_list_def)

  apply(simp only: mat_list_transpose)
  using assms length_list_transpose_mat[of M] nth_transpose[of _ "(mat_to_list M)", simplified]
  apply(simp)
  by (simp add: dim_row_list) 

(* With a positive unit count, a weight list of that many rows, and all rows
   as long as Inputs, the first weight row has the length of Inputs. The
   assumption on the bias length is part of the statement but is not among the
   facts passed to metis. *)
lemma hd_length_inputs: ‹0 < units x3 ⟹
    length (β x3) = units x3 ⟹ length (ω x3) = units x3 ⟹ ∀r∈set (ω x3). length r = length Inputs ⟹ length Inputs = length (List.hd (ω x3))›
  by (metis length_greater_0_conv list.set_sel(1)) 


subsection‹Semantic Equivalence of List-based and Matrix-based Models›
(* For an In layer, the list-based layer prediction on vs equals the
   matrix-based prediction of the converted network on vec_of_list vs, mapped
   back with list_of_vec. *)
lemma In_l_to_m_eq:
  ‹predict⇩_l⇩_a⇩_y⇩_e⇩_r⇩_{_}⇩_l N (Some vs) (In l)  = map_option list_of_vec (predict⇩_l⇩_a⇩_y⇩_e⇩_r_⇩_m (nn_list_to_matrix N) (Some (vec_of_list vs)) (layer_list_to_matrix (In l)))› 
  by(simp add:list_vec)

(* Converse orientation of In_l_to_m_eq: the matrix-based prediction for an In
   layer equals the list-based prediction mapped forward with vec_of_list. *)
lemma In_l_to_m_eq':
  ‹predict⇩_l⇩_a⇩_y⇩_e⇩_r_⇩_m (nn_list_to_matrix N) (Some (vec_of_list vs)) (layer_list_to_matrix (In l)) = map_option vec_of_list  (predict⇩_l⇩_a⇩_y⇩_e⇩_r⇩_{_}⇩_l N (Some vs) (In l)) › 
  by(simp add:list_vec)

(* For an Out layer, the list-based layer prediction on vs equals the
   matrix-based prediction of the converted network on vec_of_list vs, mapped
   back with list_of_vec. *)
lemma Out_l_to_m_eq:
  ‹predict⇩_l⇩_a⇩_y⇩_e⇩_r⇩_{_}⇩_l N (Some vs) (Out l) = map_option list_of_vec (predict⇩_l⇩_a⇩_y⇩_e⇩_r_⇩_m (nn_list_to_matrix N) (Some (vec_of_list vs)) (layer_list_to_matrix (Out l)))› 
  by(simp add:list_vec)

(* Converse orientation of Out_l_to_m_eq: the matrix-based prediction for an
   Out layer equals the list-based prediction mapped forward with vec_of_list. *)
lemma Out_l_to_m_eq':
  ‹predict⇩_l⇩_a⇩_y⇩_e⇩_r_⇩_m (nn_list_to_matrix N) (Some (vec_of_list vs)) (layer_list_to_matrix (Out l)) = map_option vec_of_list (predict⇩_l⇩_a⇩_y⇩_e⇩_r⇩_{_}⇩_l N (Some vs) (Out l))› 
  by(simp add:list_vec)

(* For a Dense layer that is consistent for inputs of length "length vs", the
   list-based layer prediction on vs equals the matrix-based prediction of the
   converted network on vec_of_list vs, mapped back with list_of_vec.
   Proof: split on whether the activation table has an entry for the layer's
   activation key. If it has one, the vector-matrix product is rewritten with
   vec_mult_mat_list; the first four subgoals after the subst discharge its
   side conditions, the last one compares the resulting list expressions. *)
lemma Dense_l_to_m_eq:
  assumes ‹layer_consistent⇩_l N (length vs) (Dense l)›
  shows ‹predict⇩_l⇩_a⇩_y⇩_e⇩_r⇩_{_}⇩_l N (Some (vs::'a::comm_ring list)) (Dense l) 
    = map_option list_of_vec (predict⇩_l⇩_a⇩_y⇩_e⇩_r_⇩_m (nn_list_to_matrix N) (Some (vec_of_list vs)) (layer_list_to_matrix (Dense l)))› 
proof(cases " activation_tab N (φ l) = None")
  case True
  then show ?thesis by(auto simp add: nn_list_to_matrix_def activation_list_to_matrix_def o_def )
next
  case False
  then show ?thesis 
    using assms
    apply(simp add: nn_list_to_matrix_def activation_list_to_matrix_def o_def)[1]
    apply (simp add: dim_mult_vec_mat dim_row_mat_of_row_list) 
    apply(subst vec_mult_mat_list)
    subgoal by(simp add: dim_col_list)
    subgoal by (simp add: dim_col_mat_of_row_list hd_length_inputs) 
    subgoal by(simp add: dim_row_mat_of_row_list)
    subgoal by(simp add: dim_col_mat_of_row_list, metis gr_implies_not0 hd_in_set length_0_conv)
    subgoal apply(clarsimp simp add:list_vec)
      subgoal apply(subst mat_list)
        subgoal by(metis length_greater_0_conv list.set_sel(1))
        subgoal using list_vec map2_mult_commute map_eq_conv vec_of_list_map 
          apply(clarsimp simp add:o_def)  
          using Matrix_Utils.vec_add_list length_map map2_mult_commute map_eq_conv vec_of_list_map        
          by (smt (verit) dim_col_mat_of_row_list hd_length_inputs) 
        done          
      done 
    done
qed

(* Converse orientation of Dense_l_to_m_eq under the same consistency
   assumption: the matrix-based prediction for a Dense layer equals the
   list-based prediction mapped forward with vec_of_list. Derived from
   Dense_l_to_m_eq and vec_list. *)
lemma Dense_l_to_m_eq':
  assumes ‹layer_consistent⇩_l N (length vs) (Dense l)›
  shows ‹predict⇩_l⇩_a⇩_y⇩_e⇩_r_⇩_m (nn_list_to_matrix N) (Some (vec_of_list vs)) (layer_list_to_matrix (Dense l))
       = map_option vec_of_list (predict⇩_l⇩_a⇩_y⇩_e⇩_r⇩_{_}⇩_l N (Some (vs::'a::comm_ring list)) (Dense l))› 
  using Dense_l_to_m_eq
  by (smt (verit) assms not_Some_eq option.simps(8) option.simps(9) vec_list) 




(* For an Activation layer, the list-based layer prediction on vs equals the
   matrix-based prediction of the converted network on vec_of_list vs, mapped
   back with list_of_vec. Proof: split on whether the activation table has an
   entry for the layer's activation key. *)
lemma Activation_l_to_m_eq:
  ‹predict⇩_l⇩_a⇩_y⇩_e⇩_r⇩_{_}⇩_l N (Some vs) (Activation l) 
 = map_option list_of_vec (predict⇩_l⇩_a⇩_y⇩_e⇩_r_⇩_m (nn_list_to_matrix N) (Some (vec_of_list vs)) (layer_list_to_matrix (Activation l)))› 
proof(cases " activation_tab N (φ l) = None")
  case True
  then show ?thesis by(auto simp add: nn_list_to_matrix_def activation_list_to_matrix_def o_def )
next
  case False
  then show ?thesis 
    apply(simp add:list_vec nn_list_to_matrix_def activation_list_to_matrix_def)
    by(simp add: vec_list list_vec split:option.splits)
qed

(* Converse orientation of Activation_l_to_m_eq: the matrix-based prediction
   for an Activation layer equals the list-based prediction mapped forward
   with vec_of_list. Derived from Activation_l_to_m_eq and vec_list. *)
lemma Activation_l_to_m_eq':
  ‹predict⇩_l⇩_a⇩_y⇩_e⇩_r_⇩_m (nn_list_to_matrix N) (Some (vec_of_list vs)) (layer_list_to_matrix (Activation l))
 = map_option vec_of_list (predict⇩_l⇩_a⇩_y⇩_e⇩_r⇩_{_}⇩_l N (Some vs) (Activation l))›
  by (smt (verit, del_insts) Activation_l_to_m_eq option.exhaust_sel option.map_disc_iff option.map_sel vec_list) 


(* Auxiliary step for a Dense head layer l = Dense x3.
   Premises: an induction-hypothesis-shaped equation relating the list-based
   and matrix-based foldl over layers' for arbitrary Inputs, validity of the
   activation table, the size facts of the Dense layer, consistency of layers'
   for input width "units x3", and an activation entry y for the layer.
   Conclusion: the same foldl equation, started from the list-based output of
   the Dense layer (y applied to weighted sums plus bias).
   NOTE(review): presumably used in the Cons/Dense case of
   precdict_seq_l_eq_m', whose proof continues beyond this part of the file -
   confirm. *)
lemma aux1: ‹
⋀y. l = Dense x3 ⟹
         (⋀Inputs.
             layers_consistent⇩_l ⦇layers = l0, activation_tab = activation_tab'⦈ (length Inputs) layers' ⟹
             foldl (predict⇩_l⇩_a⇩_y⇩_e⇩_r⇩_{_}⇩_l ⦇layers = l1, activation_tab = activation_tab'⦈) (Some Inputs) layers' =
             map_option list_of_vec (foldl (predict⇩_l⇩_a⇩_y⇩_e⇩_r_⇩_m (nn_list_to_matrix ⦇layers = l2, activation_tab = activation_tab'⦈)) (Some (vec_of_list Inputs)) (layers (nn_list_to_matrix ⦇layers = layers', activation_tab = a2⦈)))) ⟹
         valid_activation_tab⇩_l activation_tab' ⟹
         0 < units x3 ⟹
         Inputs ≠ [] ⟹
         length (LayerRecord.β x3) = units x3 ⟹
         length (LayerRecord.ω x3) = units x3 ⟹
         ∀r∈set (LayerRecord.ω x3). length r = length Inputs ⟹
         layers_consistent⇩_l ⦇layers = l0, activation_tab = activation_tab'⦈ (units x3) layers' ⟹
         activation_tab' (ActivationRecord.φ x3) = Some y ⟹
         foldl (predict⇩_l⇩_a⇩_y⇩_e⇩_r⇩_{_}⇩_l ⦇layers = l1, activation_tab = activation_tab'⦈) (Some (y (map2 (+) (map ((λvs'. ∑(x, y)←vs'. x * y) ∘ zip Inputs) (LayerRecord.ω x3)) (LayerRecord.β x3)))) layers' =
         map_option list_of_vec
          (foldl (predict⇩_l⇩_a⇩_y⇩_e⇩_r_⇩_m (nn_list_to_matrix ⦇layers = l2, activation_tab = activation_tab'⦈)) (Some (vec_of_list (y (map2 (+) (map ((λvs'. ∑(x, y)←vs'. x * y) ∘ zip Inputs) (LayerRecord.ω x3)) (LayerRecord.β x3)))))
            (map layer_list_to_matrix layers')) ›
    proof -
      fix y :: "'a list ⇒ 'a list"
      assume a1: "valid_activation_tab⇩_l activation_tab'"
      assume a2: "length (β x3) = units x3"
      assume a3: "length (ω x3) = units x3"
      assume a4: "activation_tab' (φ x3) = Some y"
      assume a5: "layers_consistent⇩_l ⦇layers = l0, activation_tab = activation_tab'⦈ (units x3) layers'"
      assume a6: "⋀Inputs. layers_consistent⇩_l ⦇layers = l0, activation_tab = activation_tab'⦈ (length Inputs) layers' 
      ⟹ foldl (predict⇩_l⇩_a⇩_y⇩_e⇩_r⇩_{_}⇩_l ⦇layers = l1, activation_tab = activation_tab'⦈) (Some Inputs) layers' = map_option list_of_vec (foldl (predict⇩_l⇩_a⇩_y⇩_e⇩_r_⇩_m (nn_list_to_matrix ⦇layers = l2, activation_tab = activation_tab'⦈)) (Some (vec_of_list Inputs)) (layers (nn_list_to_matrix ⦇layers = layers', activation_tab = a2⦈)))"
      (* a valid activation function keeps the length of its argument, so the
         Dense output has length "units x3" and a6 applies via a5 *)
      have "⋀as. length (y as) = length as"
        using a4 a1 by (metis (no_types) NN_Layers_List_Main.valid_activation_preserves_length)
      then show "foldl (predict⇩_l⇩_a⇩_y⇩_e⇩_r⇩_{_}⇩_l ⦇layers = l1, activation_tab = activation_tab'⦈) (Some (y (map2 (+) (map ((λps. ∑(x, y)←ps. x * y) ∘ zip Inputs) (ω x3)) (β x3)))) layers' = map_option list_of_vec (foldl (predict⇩_l⇩_a⇩_y⇩_e⇩_r_⇩_m (nn_list_to_matrix ⦇layers = l2, activation_tab = activation_tab'⦈)) (Some (vec_of_list (y (map2 (+) (map ((λps. ∑(x, y)←ps. x * y) ∘ zip Inputs) (ω x3)) (β x3))))) (map layer_list_to_matrix layers'))"
        using a6 a5 a3 a2 by (simp add: nn_list_to_matrix_def)
    qed

(* Fold-level equivalence, list model to matrix model.

   Assuming layers' is consistent for inputs of length (length Inputs) and the
   activation table is valid, folding the list-based layer prediction over layers'
   starting from Some Inputs gives the same result as folding the matrix-based
   layer prediction over the converted layers starting from
   Some (vec_of_list Inputs), after mapping the result back with list_of_vec.

   The layers fields l0, l1, l2 and the activation tables a1, a2 of the records
   in the statement are independent free variables; only activation_tab' and
   layers' are shared between both sides.

   Proof: induction on layers' (Inputs arbitrary), then a case split on the
   constructor of the head layer. *)
lemma precdict_seq_l_eq_m':
  assumes ‹layers_consistent⇩_l ⦇layers = l0, activation_tab = activation_tab'⦈ (length (Inputs::'a::comm_ring list)) layers'›
    and ‹valid_activation_tab⇩_l activation_tab'›
  shows ‹foldl (predict⇩_l⇩_a⇩_y⇩_e⇩_r⇩_{_}⇩_l ⦇layers = l1, activation_tab = activation_tab'⦈) (Some (Inputs)) (layers ⦇layers = layers', activation_tab =a1⦈) =
    map_option list_of_vec
     (foldl (predict⇩_l⇩_a⇩_y⇩_e⇩_r_⇩_m (nn_list_to_matrix ⦇layers = l2, activation_tab = activation_tab'⦈)) (Some (vec_of_list Inputs))
       (layers (nn_list_to_matrix ⦇layers = layers', activation_tab = a2⦈)))›
proof(insert assms, induction "layers'" arbitrary: Inputs)
  (* Empty layer list: both folds return their start value; list_vec closes the goal. *)
  case Nil then show ?case 
    unfolding predict⇩_s⇩_e⇩_q⇩_{_}⇩_l⇩_a⇩_y⇩_e⇩_r_⇩_l_def predict⇩_s⇩_e⇩_q⇩_{_}⇩_l⇩_a⇩_y⇩_e⇩_r⇩_{_}⇩_m'_def predict⇩_s⇩_e⇩_q⇩_{_}⇩_l⇩_a⇩_y⇩_e⇩_r⇩_{_}⇩_m_def 
      nn_list_to_matrix_def o_def activation_list_to_matrix_def in_deg_NN_def
    by(simp add:list_vec)
next
  case (Cons l layers')
  then show ?case 
  proof(cases l)
    (* In and Out layers: discharged by simp with the Cons facts and the
       fold_predict_*_strict lemmas. *)
    case (In x1)      
    then show ?thesis
      apply(simp add:Cons)
      using Cons
      by ( simp add: layers_list_to_matrix list_vec  fold_predict_l_strict fold_predict_m_strict)
  next
    case (Out x2)
    then show ?thesis
      using Cons
      by ( simp add: layers_list_to_matrix list_vec  fold_predict_l_strict fold_predict_m_strict)
  next
    (* Dense layer: rewrite the first list-based step with Dense_l_to_m_eq'
       (its side condition comes from Cons.prems(1)), then finish with the
       induction hypothesis and aux1.
       NOTE(review): predict_layer is a proof method defined outside this chunk. *)
    case (Dense x3) note i = this
    then show ?thesis 
      apply(predict_layer add:layers_list_to_matrix)
      apply(subst Dense_l_to_m_eq')
      using Cons.prems(1) layers_consistent⇩_l.simps(2) apply(simp)  
      using Cons.IH  Cons.prems(1) assms(2) 
      apply(simp) 
      using aux1  
      by (smt (verit) F NN_Layers_List_Main.valid_activation_preserves_length layers_list_to_matrix length_map length_upt list.map_comp
          neural_network_seq_layers.simps(1) option.simps(5,9) verit_minus_simplify(2))
  next
    (* Activation layer: rewrite the first step with Activation_l_to_m_eq', then
       use the induction hypothesis; length preservation of valid activations
       keeps the consistency premise applicable. *)
    case (Activation x4)
    then show ?thesis 
      apply(predict_layer add:layers_list_to_matrix)
      apply(subst Activation_l_to_m_eq')
      using Cons.IH Cons.prems(1) assms(2) 
      apply(simp)
      by (metis (mono_tags, lifting) NN_Layers_List_Main.valid_activation_preserves_length layers_list_to_matrix
          neural_network_seq_layers.select_convs(1) option.simps(5,9))
  qed
qed


(* Main result, list model to matrix model: for a network N whose layers are
   consistent for inputs of length (length Inputs) and whose activation table is
   valid, the list-based sequential prediction on N equals the matrix-based
   prediction (the primed variant, which takes a list input) on
   nn_list_to_matrix N.

   Proof: split the record N into its fields, unfold the prediction
   definitions, and rewrite with the fold-level lemma precdict_seq_l_eq_m'. *)
theorem precdict_seq_l_eq_m:
  assumes ‹layers_consistent⇩_l N (length Inputs) (layers N)› 
    and ‹valid_activation_tab⇩_l (activation_tab N)›
  shows ‹predict⇩_s⇩_e⇩_q⇩_{_}⇩_l⇩_a⇩_y⇩_e⇩_r_⇩_l  N (Inputs::'a::comm_ring list) = predict⇩_s⇩_e⇩_q⇩_{_}⇩_l⇩_a⇩_y⇩_e⇩_r⇩_{_}⇩_m' (nn_list_to_matrix N) Inputs›
proof(cases "N")
  case (fields layers activation_tab)
  then show ?thesis 
    using assms
    apply(simp)
    unfolding predict⇩_s⇩_e⇩_q⇩_{_}⇩_l⇩_a⇩_y⇩_e⇩_r_⇩_l_def predict⇩_s⇩_e⇩_q⇩_{_}⇩_l⇩_a⇩_y⇩_e⇩_r⇩_{_}⇩_m'_def predict⇩_s⇩_e⇩_q⇩_{_}⇩_l⇩_a⇩_y⇩_e⇩_r⇩_{_}⇩_m_def
    by(subst precdict_seq_l_eq_m', simp_all)
qed

(* Single-step equivalence for an In layer, matrix model to list model: the
   matrix-based prediction on vs equals vec_of_list applied (under map_option)
   to the list-based prediction on list_of_vec vs in the converted network.
   No consistency assumption is needed. *)
lemma In_m_to_l_eq:
  ‹predict⇩_l⇩_a⇩_y⇩_e⇩_r_⇩_m N (Some vs) (In l)  = map_option vec_of_list (predict⇩_l⇩_a⇩_y⇩_e⇩_r⇩_{_}⇩_l (nn_matrix_to_list N) (Some (list_of_vec vs)) (layer_matrix_to_list (In l)))› 
  by(simp add:vec_list)

(* Reverse orientation of In_m_to_l_eq: the list-based prediction for an In
   layer on list_of_vec vs equals list_of_vec applied (under map_option) to the
   matrix-based prediction on vs. Oriented this way so it can be used as a
   rewrite rule on list-side goals. *)
lemma In_m_to_l_eq':
  ‹predict⇩_l⇩_a⇩_y⇩_e⇩_r⇩_{_}⇩_l (nn_matrix_to_list N) (Some (list_of_vec vs)) (layer_matrix_to_list (In l)) = map_option list_of_vec  (predict⇩_l⇩_a⇩_y⇩_e⇩_r_⇩_m N (Some vs) (In l)) › 
  by(simp add:vec_list)

(* Single-step equivalence for an Out layer, matrix model to list model: the
   matrix-based prediction on vs equals vec_of_list applied (under map_option)
   to the list-based prediction on list_of_vec vs in the converted network.
   No consistency assumption is needed. *)
lemma Out_m_to_l_eq:
  ‹predict⇩_l⇩_a⇩_y⇩_e⇩_r_⇩_m N (Some vs) (Out l)  = map_option vec_of_list (predict⇩_l⇩_a⇩_y⇩_e⇩_r⇩_{_}⇩_l (nn_matrix_to_list N) (Some (list_of_vec vs)) (layer_matrix_to_list (Out l)))› 
  by(simp add:vec_list)

(* Reverse orientation of Out_m_to_l_eq: the list-based prediction for an Out
   layer on list_of_vec vs equals list_of_vec applied (under map_option) to the
   matrix-based prediction on vs.
   Both sides refer to the same layer (Out l), mirroring In_m_to_l_eq' and
   Out_m_to_l_eq, so the rule rewrites list-side goals about Out layers. *)
lemma Out_m_to_l_eq':
  ‹predict⇩_l⇩_a⇩_y⇩_e⇩_r⇩_{_}⇩_l (nn_matrix_to_list N) (Some (list_of_vec vs)) (layer_matrix_to_list (Out l)) = map_option list_of_vec  (predict⇩_l⇩_a⇩_y⇩_e⇩_r_⇩_m N (Some vs) (Out l)) › 
  by(simp add:vec_list)

(* Single-step equivalence for a Dense layer, matrix model to list model.
   Requires the layer to be consistent (in the matrix sense) for an input of
   dimension dim_vec vs.

   Proof: case split on whether the activation table of N has an entry for the
   activation symbol of the layer.
   - No entry: closed by auto after unfolding the conversion definitions.
   - Entry present: unfold the conversions, then turn vector addition and
     vector-matrix multiplication into their list counterparts with
     vec_add_list' and vec_mult_mat_list; the four intermediate subgoals are the
     dimension side conditions of those rewrites, the last one is the remaining
     equation. *)
lemma Dense_m_to_l_eq:
  assumes ‹layer_consistent⇩_m N (dim_vec vs) (Dense l)›
  shows ‹predict⇩_l⇩_a⇩_y⇩_e⇩_r_⇩_m N (Some (vs::'a::comm_ring Matrix.vec)) (Dense l) 
    = map_option vec_of_list (predict⇩_l⇩_a⇩_y⇩_e⇩_r⇩_{_}⇩_l (nn_matrix_to_list N) (Some (list_of_vec vs)) (layer_matrix_to_list (Dense l)))› 
proof(cases " activation_tab N (φ l) = None")
  case True
  then show ?thesis by(auto simp add: nn_matrix_to_list_def activation_matrix_to_list_def o_def )
next
  case False
  then show ?thesis 
    apply(clarsimp simp add: nn_matrix_to_list_def activation_matrix_to_list_def o_def)[1]
    subgoal using assms
      apply(simp add: nn_matrix_to_list_def activation_matrix_to_list_def o_def)[1]
      (* list form of the bias addition; its side condition is a dimension equality *)
      apply(subst vec_add_list')
       apply (simp add: dim_mult_vec_mat dim_row_mat_of_row_list) 
      apply(simp)
      (* list form of the vector-matrix product, followed by its side conditions *)
      apply(subst vec_mult_mat_list)
      subgoal by(simp add: dim_col_list)
      subgoal by(simp add: dim_col_mat_of_row_list hd_length_inputs)
      subgoal by(simp add: dim_row_mat_of_row_list)
      subgoal by(auto simp add: dim_col_mat_of_row_list)
      subgoal apply(simp add:list_vec map2_mult_commute vec_list list_mat_transpose_transpose)         
        by (smt (z3) Matrix_Utils.vec_add_list dim_col_mat_list dim_vec_of_list index_map_vec(2) index_transpose_mat(3)
            length_list_transpose_mat mat_list_transpose nat_neq_iff vec_list vec_of_dim_0 vec_of_list_map zero_vec_zero)  
      done
    done 
qed

(* Reverse orientation of Dense_m_to_l_eq under the same consistency assumption:
   the list-based prediction for a Dense layer on list_of_vec vs equals
   list_of_vec applied (under map_option) to the matrix-based prediction on vs.
   Derived from Dense_m_to_l_eq together with list_vec and facts about
   map_option. *)
lemma Dense_m_to_l_eq':
  assumes ‹layer_consistent⇩_m N (dim_vec vs) (Dense l)›
  shows ‹predict⇩_l⇩_a⇩_y⇩_e⇩_r⇩_{_}⇩_l (nn_matrix_to_list N) (Some (list_of_vec vs)) (layer_matrix_to_list (Dense l))
       = map_option list_of_vec (predict⇩_l⇩_a⇩_y⇩_e⇩_r_⇩_m N (Some (vs::'a::comm_ring Matrix.vec)) (Dense l))› 
  using Dense_m_to_l_eq
  by (smt (verit) assms not_Some_eq option.simps(8) option.simps(9) list_vec) 

(* Single-step equivalence for an Activation layer, matrix model to list model.
   No consistency assumption is needed.

   Proof: case split on whether the activation table of N has an entry for the
   activation symbol of the layer; both cases are closed by simplification after
   unfolding the conversion definitions (the second one additionally splits on
   option values). *)
lemma Activation_m_to_l_eq:
  ‹predict⇩_l⇩_a⇩_y⇩_e⇩_r_⇩_m N (Some vs) (Activation l) 
 = map_option vec_of_list (predict⇩_l⇩_a⇩_y⇩_e⇩_r⇩_{_}⇩_l (nn_matrix_to_list N) (Some (list_of_vec vs)) (layer_matrix_to_list (Activation l)))› 
proof(cases " activation_tab N (φ l) = None")
  case True
  then show ?thesis by(auto simp add: nn_matrix_to_list_def activation_matrix_to_list_def o_def )
next
  case False
  then show ?thesis 
    apply(simp add:list_vec nn_matrix_to_list_def activation_matrix_to_list_def)
    by(simp add: vec_list list_vec split:option.splits)
qed

(* Reverse orientation of Activation_m_to_l_eq: the list-based prediction for an
   Activation layer on list_of_vec vs equals list_of_vec applied (under
   map_option) to the matrix-based prediction on vs. Derived from
   Activation_m_to_l_eq together with list_vec and facts about options. *)
lemma Activation_m_to_l_eq':
  ‹predict⇩_l⇩_a⇩_y⇩_e⇩_r⇩_{_}⇩_l (nn_matrix_to_list N) (Some (list_of_vec vs)) (layer_matrix_to_list (Activation l))
 = map_option list_of_vec (predict⇩_l⇩_a⇩_y⇩_e⇩_r_⇩_m N (Some vs) (Activation l))›
  by (smt (verit, del_insts) Activation_m_to_l_eq option.exhaust_sel option.map_disc_iff option.map_sel list_vec) 

(* Fold-level equivalence, matrix model to list model (the mirror image of
   precdict_seq_l_eq_m').

   Assuming layers' is consistent (in the matrix sense) for inputs of dimension
   dim_vec Inputs and the activation table is valid, folding the matrix-based
   layer prediction over layers' starting from Some Inputs gives the same result
   as folding the list-based layer prediction over the converted layers starting
   from Some (list_of_vec Inputs), after mapping the result back with
   vec_of_list.

   The layers fields l0, l1, l2 and the activation tables a1, a2 of the records
   in the statement are independent free variables.

   Proof: induction on layers', then a case split on the constructor of the head
   layer.
   NOTE(review): the variable a listed after "arbitrary:" does not occur in the
   lemma statement; presumably a leftover - confirm before removing, since the
   shape of Cons.IH used below may depend on it. *)
lemma precdict_seq_m_eq_l':
  assumes ‹layers_consistent⇩_m ⦇layers = l0, activation_tab = activation_tab'⦈ (dim_vec (Inputs::'a::comm_ring Matrix.vec)) layers'›
    and ‹valid_activation_tab⇩_m activation_tab'›
  shows ‹foldl (predict⇩_l⇩_a⇩_y⇩_e⇩_r_⇩_m ⦇layers = l1, activation_tab = activation_tab'⦈) (Some (Inputs)) (layers ⦇layers = layers', activation_tab =a1⦈) =
    map_option vec_of_list
     (foldl (predict⇩_l⇩_a⇩_y⇩_e⇩_r⇩_{_}⇩_l (nn_matrix_to_list ⦇layers = l2, activation_tab = activation_tab'⦈)) (Some (list_of_vec Inputs))
       (layers (nn_matrix_to_list ⦇layers = layers', activation_tab = a2⦈)))›
proof(insert assms, induction "layers'" arbitrary: Inputs a)
  (* Empty layer list: both folds return their start value; vec_list closes the goal. *)
  case Nil then show ?case 
    unfolding predict⇩_s⇩_e⇩_q⇩_{_}⇩_l⇩_a⇩_y⇩_e⇩_r_⇩_l_def predict⇩_s⇩_e⇩_q⇩_{_}⇩_l⇩_a⇩_y⇩_e⇩_r⇩_{_}⇩_m'_def predict⇩_s⇩_e⇩_q⇩_{_}⇩_l⇩_a⇩_y⇩_e⇩_r⇩_{_}⇩_m_def 
      nn_matrix_to_list_def o_def activation_matrix_to_list_def in_deg_NN_def
    by(simp add:vec_list)
next
  case (Cons l layers')
  then show ?case 
  proof(cases l)
    (* In and Out layers: discharged by auto with the Cons facts and the
       fold_predict_*_strict lemmas. *)
    case (In x1)      
    then show ?thesis
      using Cons
      by (auto simp add: layers_matrix_to_list vec_list   fold_predict_l_strict fold_predict_m_strict)
  next
    case (Out x2)
    then show ?thesis
      using Cons
      by (auto simp add: layers_matrix_to_list vec_list  fold_predict_l_strict fold_predict_m_strict)
  next
    (* Dense layer: rewrite the first list-side step with Dense_m_to_l_eq' (its
       side condition comes from Cons.prems(1)), then apply the induction
       hypothesis; valid_activation_preserves_dim keeps the consistency premise
       applicable to the layer output.
       NOTE(review): predict_layer is a proof method defined outside this chunk. *)
    case (Dense x3) note i = this
    then show ?thesis 
      apply(predict_layer add:layers_matrix_to_list)
      apply(subst Dense_m_to_l_eq')
      using Cons.prems(1) layers_consistent⇩_m.simps(2) apply(simp)  
      using Cons.IH  Cons.prems(1) assms(2) 
      apply(clarsimp)[1] 
      by (metis (no_types, lifting) index_add_vec(2) layers_matrix_to_list 
          neural_network_seq_layers.select_convs(1) valid_activation_preserves_dim)
  next
    (* Activation layer: rewrite the first list-side step with
       Activation_m_to_l_eq', then apply the induction hypothesis. *)
    case (Activation x4)
    then show ?thesis 
      apply(predict_layer add:layers_matrix_to_list)
      apply(subst Activation_m_to_l_eq')
      using Cons.IH Cons.prems(1) assms(2) 
      apply(clarsimp)[1]
      by (metis (no_types, lifting) layers_matrix_to_list neural_network_seq_layers.select_convs(1) 
          valid_activation_preserves_dim)
  qed
qed

(* Main result, matrix model to list model: for a matrix-based network N whose
   layers are consistent for inputs of size (length Inputs) and whose activation
   table is valid, the matrix-based prediction (the primed variant, which takes
   a list input) on N equals the list-based sequential prediction on
   nn_matrix_to_list N. Inputs is a list here, hence length rather than dim_vec
   in the first assumption.

   Proof: split the record N into its fields, unfold the prediction
   definitions, rewrite with the fold-level lemma precdict_seq_m_eq_l', and
   close the remaining goal with an smt call over both fold-level lemmas and
   the conversion facts. *)
theorem precdict_seq_m_eq_l:
  assumes ‹layers_consistent⇩_m N (length Inputs) (layers N)› 
    and ‹valid_activation_tab⇩_m (activation_tab N)›
  shows ‹predict⇩_s⇩_e⇩_q⇩_{_}⇩_l⇩_a⇩_y⇩_e⇩_r⇩_{_}⇩_m'  N (Inputs::'a::comm_ring list) = predict⇩_s⇩_e⇩_q⇩_{_}⇩_l⇩_a⇩_y⇩_e⇩_r_⇩_l (nn_matrix_to_list N) Inputs›
proof(cases "N")
  case (fields layers activation_tab)
  then show ?thesis 
    using assms
    apply(simp)
    unfolding predict⇩_s⇩_e⇩_q⇩_{_}⇩_l⇩_a⇩_y⇩_e⇩_r_⇩_l_def predict⇩_s⇩_e⇩_q⇩_{_}⇩_l⇩_a⇩_y⇩_e⇩_r⇩_{_}⇩_m'_def predict⇩_s⇩_e⇩_q⇩_{_}⇩_l⇩_a⇩_y⇩_e⇩_r⇩_{_}⇩_m_def
    apply(subst precdict_seq_m_eq_l', simp_all) 
    by (smt (verit, ccfv_threshold) assms(1) layers_consistent_seq_m_imp_l layers_matrix_to_list 
        length_list_of_vec list_matrix_inverse list_vec neural_network_seq_layers.select_convs(2) 
        nn_matrix_to_list_def precdict_seq_l_eq_m' precdict_seq_m_eq_l' valid_activation_tab_seq_m_imp_l) 
qed

(* Vector-input variant of precdict_seq_m_eq_l: for a vector Inputs, the
   matrix-based sequential prediction on N, mapped to a list with list_of_vec,
   equals the list-based sequential prediction on nn_matrix_to_list N applied to
   list_of_vec Inputs. Obtained from precdict_seq_m_eq_l via the definition of
   the primed prediction function and the vec_list / dim_vec_of_list facts. *)
corollary precdict_seq_m_eq_l2:
  assumes ‹layers_consistent⇩_m N (dim_vec Inputs) (layers N)› 
    and ‹valid_activation_tab⇩_m (activation_tab N)›
  shows ‹map_option list_of_vec (predict⇩_s⇩_e⇩_q⇩_{_}⇩_l⇩_a⇩_y⇩_e⇩_r⇩_{_}⇩_m N Inputs) = predict⇩_s⇩_e⇩_q⇩_{_}⇩_l⇩_a⇩_y⇩_e⇩_r_⇩_l (nn_matrix_to_list N) (list_of_vec Inputs)›
  using precdict_seq_m_eq_l predict⇩_s⇩_e⇩_q⇩_{_}⇩_l⇩_a⇩_y⇩_e⇩_r⇩_{_}⇩_m'_def dim_vec_of_list 
  by (metis assms(1) assms(2) vec_list) 
end