Skip to content

Commit

Permalink
random doodling with revCDeriv and dense layers
Browse files Browse the repository at this point in the history
  • Loading branch information
lecopivo committed Oct 4, 2023
1 parent 6652091 commit 53e4dc2
Show file tree
Hide file tree
Showing 2 changed files with 82 additions and 13 deletions.
8 changes: 4 additions & 4 deletions SciLean/Doodle.lean
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
import SciLean.Core.FunctionTransformations.RevCDeriv
import SciLean.Core.Notation.RevCDeriv
import SciLean.Core.FloatAsReal
import SciLean.Util.Limit
-- import SciLean.Core.FunctionTransformations.RevCDeriv
-- import SciLean.Core.Notation.RevCDeriv
-- import SciLean.Core.FloatAsReal
-- import SciLean.Util.Limit

open SciLean

Expand Down
87 changes: 78 additions & 9 deletions SciLean/Modules/ML/DenseLayer.lean
Original file line number Diff line number Diff line change
Expand Up @@ -11,16 +11,84 @@ variable
{K : Type _} [IsROrC K]
{W : Type _} [Vec K W]

-- set_default_scalar R
set_default_scalar K

variable {α β κ ι} [Index α] [Index κ] [Index β] [Index ι] [PlainDataType K] [PlainDataType R]
variable {α β κ ι : Type} [Index α] [Index κ] [Index β] [Index ι] [PlainDataType K] [PlainDataType R]

variable (κ)
/-- Dense (fully connected) layer: output index `j` is `∑ i, weights[(j,i)] * x[i] + bias[j]`.
NOTE(review): this is the pre-refactor definition shown by the diff; the commit replaces it
with the `denseLazy`-based version further below — confirm only one survives in the file. -/
def dense (weights : DataArrayN K (κ×ι)) (bias : DataArrayN K κ) (x : DataArrayN K ι) : DataArrayN K κ :=
⊞ j => ∑ i, weights[(j,i)] * x[i] + bias[j]
/-- Index-wise ("lazy") dense layer on plain functions:
`denseLazy weights bias x j = ∑ i, weights j i * x i + bias j`.
Phrasing the layer over `κ → ι → K` / `κ → K` / `ι → K` instead of `DataArrayN`
lets the `#generate_revCDeriv` commands below derive its reverse-mode rules. -/
def denseLazy (weights : κ → ι → K) (bias : κ → K) (x : ι → K) (j : κ) : K :=
∑ i, weights j i * x i + bias j
variable {κ}


-- Generate `HasAdjDiff` proofs (`prop_by`) and `revCDeriv` transformation rules (`trans_by`)
-- for `denseLazy` in the arguments `weights`, `bias`, `x`.
#generate_revCDeriv denseLazy weights bias x
prop_by unfold denseLazy; fprop
trans_by unfold denseLazy; ftrans

-- Same, but additionally treating the output index `j` as a differentiated-through argument
-- (`… | j`); the extra `simp only [curryN, …]` step normalizes the curry/uncurry wrappers
-- that appear in the generated statement before running `ftrans` again.
#generate_revCDeriv denseLazy weights bias x | j
prop_by unfold denseLazy; fprop
trans_by unfold denseLazy; ftrans; simp (config := {zeta:=false}) only [curryN,uncurryN, CurryN.curry, UncurryN.uncurry]; ftrans

-- Register only the `| j` variant as an `ftrans` rewrite rule; the non-indexed variant
-- stays disabled (commented out) — presumably to avoid the two rules competing.
attribute [ftrans] denseLazy.arg_weightsbiasx_j.revCDeriv_rule_def
-- attribute [ftrans] denseLazy.arg_weightsbiasx.revCDeriv_rule_def

variable (κ)
/-- Dense layer on `DataArrayN`/`K^κ` data, delegating each output index to `denseLazy`;
mathematically `(dense κ weights bias x)[j] = ∑ i, weights[(j,i)] * x[i] + bias[j]`
(the commented-out line is the equivalent direct definition). Routing through `denseLazy`
lets the rules generated for `denseLazy` above drive this definition's differentiation. -/
def dense (weights : DataArrayN K (κ×ι)) (bias : K^κ) (x : K^ι) : K^κ :=
-- ⊞ j => ∑ i, weights[(j,i)] * x[i] + bias[j]
⊞ j => denseLazy κ (fun j i => weights[(j,i)]) (fun j => bias[j]) (fun i => x[i]) j
variable {κ}
-- Debugging run: generate `revCDeriv` rules for `dense` with simp/ftrans tracing enabled
-- so the rewrite steps (and any discharge failures) are visible in the info view.
set_option pp.funBinderTypes true in
-- set_option trace.Meta.Tactic.fprop.unify true in
-- set_option trace.Meta.Tactic.fprop.discharge true in
-- set_option trace.Meta.Tactic.fprop.step true in
set_option trace.Meta.Tactic.simp.discharge true in
set_option trace.Meta.Tactic.simp.unify true in
set_option trace.Meta.Tactic.ftrans.step true in
#generate_revCDeriv dense weights bias x
prop_by unfold dense; fprop
trans_by unfold dense; ftrans; ftrans only


#eval 0


#check denseLazy.arg_weightsbiasx_j.revCDeriv

set_option trace.Meta.Tactic.ftrans.step true
set_option trace.Meta.Tactic.ftrans.theorems true
set_option trace.Meta.Tactic.fprop.discharge true
set_option trace.Meta.Tactic.simp.discharge true
set_option trace.Meta.Tactic.simp.congr true
set_option trace.Meta.Tactic.simp.rewrite true
set_option trace.Meta.Tactic.simp.unify true
-- NOTE(review): scratch/debugging example. The stated equality (`<∂ … = fun _ => 0`) is a
-- placeholder, presumably not the true reverse derivative; the `by` block only rewrites the
-- lhs with `ftrans only` (under the trace options enabled above) to inspect how the
-- generated `denseLazy` revCDeriv rule fires — it likely does not close the goal. TODO confirm.
example [SemiInnerProductSpace K W]
: <∂ (fun (x : ((W × DataArrayN K (κ × ι)) × K ^ κ) × K ^ ι) (j : κ) =>
denseLazy κ (fun (j : κ) (i : ι) => x.fst.fst.snd[(j, i)]) (fun (j : κ) => x.fst.snd[j]) (fun (i : ι) => x.snd[i]) j)
=
fun _ => 0 :=
by
conv =>
lhs
ftrans only


-- Inspect the declarations produced by `#generate_revCDeriv denseLazy … | j` above.
#check SciLean.denseLazy.arg_weightsbiasx_j.revCDeriv_rule_def
#check SciLean.denseLazy.arg_weightsbiasx_j.revCDeriv_rule
#check SciLean.denseLazy.arg_weightsbiasx_j.HasAdjDiff_rule

-- Stop elaboration here; everything below this point is unprocessed scratch work.
#exit
-- NOTE(review): these lines sit after the `#exit` above, so Lean never elaborates them;
-- they are kept as scratch checks that `fprop` can move `HasAdjDiff` through
-- `DataArrayN` element access `(x w)[i]` in both directions.
variable {W : Type _} [SemiInnerProductSpace K W]

-- Pointwise differentiability of every component implies differentiability of the array map.
example (x : W → DataArrayN K ι) (hx : ∀ i, HasAdjDiff K (fun w => (x w)[i]))
: HasAdjDiff K x := by fprop

-- Differentiability of the array map implies differentiability of a fixed component …
example (x : W → DataArrayN K ι) (i : ι) (hx : HasAdjDiff K x)
: HasAdjDiff K fun w => (x w)[i] := by fprop

-- … and of the fully uncurried component function.
example (x : W → DataArrayN K ι) (hx : HasAdjDiff K x)
: HasAdjDiff K fun w i => (x w)[i] := by fprop


-- def foo : Float → DataArrayN Float (Idx 10) := sorry

-- -- set_option maxHeartbeats 10000
Expand Down Expand Up @@ -104,7 +172,7 @@ theorem dense.arg_weightsbiasx.IsDifferentiable_rule
(hweights : IsDifferentiable K weights) (hbias : IsDifferentiable K bias) (hx : IsDifferentiable K x)
: IsDifferentiable K fun w => dense κ (weights w) (bias w) (x w) :=
by
unfold dense
unfold dense; unfold denseLazy
fprop


Expand All @@ -115,11 +183,11 @@ theorem dense.arg_weightsbiasx.fwdCDeriv_rule
: (fwdCDeriv K fun w => dense κ (weights w) (bias w) (x w) )
=
((fwdCDeriv K fun w => dense κ (weights w) (bias w) (x w))
rewrite_by unfold dense; autodiff) :=
rewrite_by unfold dense; unfold denseLazy; autodiff) :=
by
unfold dense
unfold dense; unfold denseLazy
conv => lhs; autodiff


set_option trace.Meta.Tactic.ftrans.step true in
@[ftrans]
Expand All @@ -129,7 +197,7 @@ theorem dense.arg_weightsbiasx.revCDeriv_rule {W : Type} [SemiInnerProductSpace
: (revCDeriv K fun w => dense κ (weights w) (bias w) (x w) )
=
((revCDeriv K fun w => dense κ (weights w) (bias w) (x w))
rewrite_by unfold dense; autodiff; autodiff) :=
rewrite_by unfold dense; unfold denseLazy; autodiff; autodiff) :=
by
sorry

Expand All @@ -155,3 +223,4 @@ section denseDerivTest

end denseDerivTest


0 comments on commit 53e4dc2

Please sign in to comment.