typing fixes and notebook updates

thibmonsel · thibmonsel · commit 7e7d1b443e76 · 2024-10-28T16:31:11.000+01:00
diff --git a/diffrax/_delays.py b/diffrax/_delays.py
@@ -18,7 +18,7 @@
 )
 from optimistix._custom_types import Aux, Fn, Y
 
-from ._custom_types import IntScalarLike, RealScalarLike, VF
+from ._custom_types import BoolScalarLike, IntScalarLike, RealScalarLike
 from ._global_interpolation import DenseInterpolation
 from ._local_interpolation import AbstractLocalInterpolation
 from ._term import VectorFieldWrapper
@@ -32,7 +32,7 @@ class _FixedPointState(eqx.Module, strict=True):
 class ModifiedFixedPointIteration(AbstractFixedPointSolver):
     rtol: float
     atol: float
-    implicit_step: bool
+    implicit_step: BoolScalarLike
     max_steps: int = eqx.field(static=True)
     norm: Callable[[PyTree], Scalar] = rms_norm
 
@@ -95,7 +95,7 @@ def postprocess(
 
 
 class Delays(eqx.Module):
-    """Module that incorportes all the information needed for integrating DDEs"""
+    """Module that incorporates all the information needed for integrating DDEs"""
 
     delays: PyTree[Callable]
     initial_discontinuities: Optional[Array] = jnp.array([0.0])
@@ -121,7 +121,7 @@ class HistoryVectorField(eqx.Module):
         - `delays` : DDE's different deviated arguments
     """
 
-    vector_field: VF
+    vector_field: Callable[..., PyTree]
     t0: RealScalarLike
     tprev: RealScalarLike
     tnext: RealScalarLike
diff --git a/diffrax/_integrate.py b/diffrax/_integrate.py
@@ -113,7 +113,7 @@ class State(eqx.Module):
     event_mask: Optional[PyTree[BoolScalarLike]]
     num_dde_implicit_step: IntScalarLike
     num_dde_explicit_step: IntScalarLike
-    discontinuities: Optional[eqxi.MaybeBuffer[Float[Array, " times_plus_1"]]]  # noqa: F821
+    discontinuities: Optional[eqxi.MaybeBuffer[ArrayLike]]  # noqa: F821
     discontinuities_save_index: Optional[IntScalarLike]
     # Output that is .at[].set() updated during the solve (and their indices)
 
@@ -347,7 +347,6 @@ def body_fun_aux(state):
                 state.solver_state,
                 state.made_jump,
             )
-            implicit_step = False
         else:
             min_delay = []
             flat_delays = jtu.tree_leaves(delays.delays)
@@ -423,6 +422,7 @@ def get_struct_dense_info(init_state):
         assert jnp.result_type(keep_step) is jnp.dtype(bool)
         # Finding all of the potential discontinuity roots
         discont_update = False
+        num_dde_explicit_step = num_dde_implicit_step = 0
         if delays is not None:
             #     _part_maybe_find_discontinuity = ft.partial(
             #         maybe_find_discontinuity,
@@ -467,11 +467,11 @@ def get_struct_dense_info(init_state):
 
             # Count the number of steps in DDEs, just for statistical purposes
             num_dde_implicit_step = state.num_dde_implicit_step + (
-                keep_step & implicit_step
-            )
-            num_dde_explicit_step = state.num_dde_explicit_step + (
-                keep_step & jnp.invert(implicit_step)
+                jnp.where(keep_step, 1, 0) & jnp.where(implicit_step, 1, 0)  # type: ignore
             )
+            num_dde_explicit_step = state.num_dde_explicit_step + (  # group `&` first
+                jnp.where(keep_step, 1, 0) & jnp.where(implicit_step, 0, 1)  # type: ignore
+            )
 
         assert jnp.result_type(keep_step) is jnp.dtype(bool)
 
@@ -694,7 +694,9 @@ def _outer_cond_fn(cond_fn_i, old_event_value_i):
                 discontinuities = maybe_inplace_delay(
                     discontinuities_save_index + 1, tnext, discontinuities
                 )
-                discontinuities_save_index = discontinuities_save_index + discont_update
+                discontinuities_save_index = discontinuities_save_index + jnp.where(
+                    discont_update, 1, 0
+                )
 
         new_state = State(
             y=y,
@@ -717,8 +719,8 @@ def _outer_cond_fn(cond_fn_i, old_event_value_i):
             event_dense_info=event_dense_info,
             event_values=event_values,
             event_mask=event_mask,
-            num_dde_explicit_step=num_dde_explicit_step,  # type: ignore
-            num_dde_implicit_step=num_dde_implicit_step,  # type: ignore
+            num_dde_explicit_step=num_dde_explicit_step,
+            num_dde_implicit_step=num_dde_implicit_step,
             discontinuities=discontinuities,  # type: ignore
             discontinuities_save_index=discontinuities_save_index,
         )
@@ -932,7 +934,7 @@ def diffeqsolve(
     t0: RealScalarLike,
     t1: RealScalarLike,
     dt0: Optional[RealScalarLike],
-    y0: PyTree[ArrayLike],
+    y0: Union[PyTree[ArrayLike], Callable[[RealScalarLike], PyTree[ArrayLike]]],
     args: PyTree[Any] = None,
     *,
     saveat: SaveAt = SaveAt(t1=True),
diff --git a/examples/dde.ipynb b/examples/dde.ipynb
@@ -102,7 +102,7 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "In our case we only have 0 since $y\\prime(t=0^{-}) \\neq y\\prime(t=0^{+})$ because $y\\prime(t=0^{+}) = - 2 \\alpha$ and   $y\\prime(t=0^{-}) = 0$.  \n",
+    "In our case we only have 0 since $y^\\prime(t=0^{-}) \\neq y^\\prime(t=0^{+})$ because $y^\\prime(t=0^{+}) = - 2 \\alpha$ and   $y^\\prime(t=0^{-}) = 0$.  \n",
     "We choose $\\tau=1$."
    ]
   },
@@ -169,7 +169,7 @@
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Integration took in 0.0011103153228759766 seconds.\n"
+      "Integration took in 0.0004780292510986328 seconds.\n"
      ]
     },
     {
@@ -212,7 +212,7 @@
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Integration took in 0.0009412765502929688 seconds.\n"
+      "Integration took in 0.0006003379821777344 seconds.\n"
      ]
     },
     {
diff --git a/examples/neural_dde.ipynb b/examples/neural_dde.ipynb
@@ -243,7 +243,7 @@
     "    dataset_size=256,\n",
     "    batch_size=128,\n",
     "    lr_strategy=(3e-3,),\n",
-    "    steps_strategy=(120,),\n",
+    "    steps_strategy=(500,),\n",
     "    length_strategy=(1.0,),\n",
     "    width_size=32,\n",
     "    depth=3,\n",
@@ -310,83 +310,38 @@
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Step: 0, Loss: 1.401884913444519, Computation time: 14.423743486404419\n",
-      "Step: 1, Loss: 1.1716960668563843, Computation time: 0.00439143180847168\n",
-      "Step: 2, Loss: 1.244404673576355, Computation time: 0.003352642059326172\n",
-      "Step: 3, Loss: 1.152793049812317, Computation time: 0.0034520626068115234\n",
-      "Step: 4, Loss: 1.2006347179412842, Computation time: 0.0023109912872314453\n",
-      "Step: 5, Loss: 1.134800910949707, Computation time: 0.003433704376220703\n",
-      "Step: 6, Loss: 1.0922808647155762, Computation time: 0.00430607795715332\n",
-      "Step: 7, Loss: 1.0771468877792358, Computation time: 0.0031037330627441406\n",
-      "Step: 8, Loss: 1.1282471418380737, Computation time: 0.0026216506958007812\n",
-      "Step: 9, Loss: 1.0664700269699097, Computation time: 0.0036363601684570312\n",
-      "Step: 10, Loss: 0.9904348254203796, Computation time: 0.0024759769439697266\n",
-      "Step: 11, Loss: 1.0465335845947266, Computation time: 0.002873659133911133\n",
-      "Step: 12, Loss: 1.0017845630645752, Computation time: 0.004104137420654297\n",
-      "Step: 13, Loss: 1.0248370170593262, Computation time: 0.002857208251953125\n",
-      "Step: 14, Loss: 0.9131743311882019, Computation time: 0.0031785964965820312\n",
-      "Step: 15, Loss: 0.9832042455673218, Computation time: 0.003298044204711914\n",
-      "Step: 16, Loss: 0.9668886661529541, Computation time: 0.002664327621459961\n",
-      "Step: 17, Loss: 0.9930294752120972, Computation time: 0.0028023719787597656\n",
-      "Step: 18, Loss: 0.9732811450958252, Computation time: 0.004416465759277344\n",
-      "Step: 19, Loss: 0.9101904630661011, Computation time: 0.0021491050720214844\n",
-      "Step: 20, Loss: 0.9569293260574341, Computation time: 0.003906965255737305\n",
-      "Step: 21, Loss: 1.000235676765442, Computation time: 0.0031125545501708984\n",
-      "Step: 22, Loss: 0.948157787322998, Computation time: 0.0025708675384521484\n",
-      "Step: 23, Loss: 0.9466567039489746, Computation time: 0.003038644790649414\n",
-      "Step: 24, Loss: 0.9593256115913391, Computation time: 0.003378629684448242\n",
-      "Step: 25, Loss: 0.9038560390472412, Computation time: 0.003355264663696289\n",
-      "Step: 26, Loss: 0.9106528162956238, Computation time: 0.0029053688049316406\n",
-      "Step: 27, Loss: 0.8822335004806519, Computation time: 0.0023543834686279297\n",
-      "Step: 28, Loss: 0.8793952465057373, Computation time: 0.002279043197631836\n",
-      "Step: 29, Loss: 0.8758573532104492, Computation time: 0.0025527477264404297\n",
-      "Step: 30, Loss: 0.8163420557975769, Computation time: 0.0034754276275634766\n",
-      "Step: 31, Loss: 0.7726603150367737, Computation time: 0.0041882991790771484\n",
-      "Step: 32, Loss: 0.7940323352813721, Computation time: 0.0024156570434570312\n",
-      "Step: 33, Loss: 0.7175382375717163, Computation time: 0.0027916431427001953\n",
-      "Step: 34, Loss: 0.7028713226318359, Computation time: 0.0023674964904785156\n",
-      "Step: 35, Loss: 0.6886805295944214, Computation time: 0.0023441314697265625\n",
-      "Step: 36, Loss: 0.6005609035491943, Computation time: 0.002215862274169922\n",
-      "Step: 37, Loss: 0.5269209742546082, Computation time: 0.003516674041748047\n",
-      "Step: 38, Loss: 0.4020206332206726, Computation time: 0.0025489330291748047\n",
-      "Step: 39, Loss: 0.3255264461040497, Computation time: 0.0038254261016845703\n",
-      "Step: 40, Loss: 0.3398251533508301, Computation time: 0.0026879310607910156\n",
-      "Step: 41, Loss: 0.23914429545402527, Computation time: 0.0031821727752685547\n",
-      "Step: 42, Loss: 0.14592041075229645, Computation time: 0.002313852310180664\n",
-      "Step: 43, Loss: 0.13987970352172852, Computation time: 0.002420186996459961\n",
-      "Step: 44, Loss: 0.1373867690563202, Computation time: 0.002546548843383789\n",
-      "Step: 45, Loss: 0.16126586496829987, Computation time: 0.0025119781494140625\n",
-      "Step: 46, Loss: 0.11544477194547653, Computation time: 0.0023653507232666016\n",
-      "Step: 47, Loss: 0.061478693038225174, Computation time: 0.0027551651000976562\n",
-      "Step: 48, Loss: 0.042316604405641556, Computation time: 0.0026128292083740234\n",
-      "Step: 49, Loss: 0.09910032153129578, Computation time: 0.0021860599517822266\n",
-      "Step: 50, Loss: 0.08195476979017258, Computation time: 0.0030493736267089844\n",
-      "Step: 51, Loss: 0.036347728222608566, Computation time: 0.0036330223083496094\n",
-      "Step: 52, Loss: 0.04329509660601616, Computation time: 0.002357959747314453\n",
-      "Step: 53, Loss: 0.0774608924984932, Computation time: 0.003058910369873047\n",
-      "Step: 54, Loss: 0.07515737414360046, Computation time: 0.0029230117797851562\n",
-      "Step: 55, Loss: 0.06952822208404541, Computation time: 0.004669904708862305\n",
-      "Step: 56, Loss: 0.04167735204100609, Computation time: 0.004377126693725586\n",
-      "Step: 57, Loss: 0.043842863291502, Computation time: 0.002735614776611328\n",
-      "Step: 58, Loss: 0.06545793265104294, Computation time: 0.003109455108642578\n",
-      "Step: 59, Loss: 0.055285390466451645, Computation time: 0.003002643585205078\n",
-      "Step: 60, Loss: 0.031119057908654213, Computation time: 0.0036330223083496094\n",
-      "Step: 61, Loss: 0.03198694810271263, Computation time: 0.0037326812744140625\n",
-      "Step: 62, Loss: 0.039938874542713165, Computation time: 0.003992319107055664\n",
-      "Step: 63, Loss: 0.045956145972013474, Computation time: 0.0034766197204589844\n",
-      "Step: 64, Loss: 0.03436319902539253, Computation time: 0.0034666061401367188\n",
-      "Step: 65, Loss: 0.025405289605259895, Computation time: 0.003632783889770508\n",
-      "Step: 66, Loss: 0.023711830377578735, Computation time: 0.002114534378051758\n",
-      "Step: 67, Loss: 0.03284265473484993, Computation time: 0.0043947696685791016\n",
-      "Step: 68, Loss: 0.03023228421807289, Computation time: 0.003482341766357422\n",
-      "Step: 69, Loss: 0.021171605214476585, Computation time: 0.0029871463775634766\n",
-      "Step: 70, Loss: 0.017744384706020355, Computation time: 0.003162860870361328\n",
-      "Step: 71, Loss: 0.022380519658327103, Computation time: 0.004060029983520508\n",
-      "Step: 72, Loss: 0.02576189674437046, Computation time: 0.0023908615112304688\n",
-      "Step: 73, Loss: 0.019239962100982666, Computation time: 0.002658367156982422\n",
-      "Step: 74, Loss: 0.016447639092803, Computation time: 0.003663301467895508\n",
-      "Step: 75, Loss: 0.01782667636871338, Computation time: 0.0035588741302490234\n",
-      "Step: 76, Loss: 0.02072978764772415, Computation time: 0.0031981468200683594\n"
+      "Step: 0, Loss: 1.401884913444519, Computation time: 14.241726636886597\n",
+      "Step: 5, Loss: 1.134800910949707, Computation time: 1.192063570022583\n",
+      "Step: 10, Loss: 0.9904348254203796, Computation time: 1.9642481803894043\n",
+      "Step: 15, Loss: 0.9832042455673218, Computation time: 2.6581308841705322\n",
+      "Step: 20, Loss: 0.9569293260574341, Computation time: 3.8219752311706543\n",
+      "Step: 25, Loss: 0.9038560390472412, Computation time: 3.6977927684783936\n",
+      "Step: 30, Loss: 0.8163420557975769, Computation time: 35.42212176322937\n",
+      "Step: 35, Loss: 0.6886805295944214, Computation time: 6.909891843795776\n",
+      "Step: 40, Loss: 0.3398251533508301, Computation time: 5.504199266433716\n",
+      "Step: 45, Loss: 0.16126586496829987, Computation time: 5.103270769119263\n",
+      "Step: 50, Loss: 0.08195476979017258, Computation time: 5.78333044052124\n",
+      "Step: 55, Loss: 0.06952822208404541, Computation time: 10.413585901260376\n",
+      "Step: 60, Loss: 0.031119057908654213, Computation time: 7.735013723373413\n",
+      "Step: 65, Loss: 0.025405289605259895, Computation time: 7.267561912536621\n",
+      "Step: 70, Loss: 0.017744384706020355, Computation time: 6.29371190071106\n",
+      "Step: 75, Loss: 0.01782667636871338, Computation time: 25.47852373123169\n",
+      "Step: 80, Loss: 0.015500097535550594, Computation time: 6.827113628387451\n",
+      "Step: 85, Loss: 0.011661469005048275, Computation time: 7.4889373779296875\n",
+      "Step: 90, Loss: 0.00916498713195324, Computation time: 5.9714484214782715\n",
+      "Step: 95, Loss: 0.010490368120372295, Computation time: 6.338549613952637\n",
+      "Step: 100, Loss: 0.007394495420157909, Computation time: 6.486926078796387\n",
+      "Step: 105, Loss: 0.007423707749694586, Computation time: 7.48775839805603\n",
+      "Step: 110, Loss: 0.007470142096281052, Computation time: 6.819472312927246\n",
+      "Step: 115, Loss: 0.0059195710346102715, Computation time: 6.100851058959961\n",
+      "Step: 120, Loss: 0.005787399597465992, Computation time: 6.755363941192627\n",
+      "Step: 125, Loss: 0.005841915961354971, Computation time: 6.580211639404297\n",
+      "Step: 130, Loss: 0.006159897893667221, Computation time: 6.810395956039429\n",
+      "Step: 135, Loss: 0.0052039725705981255, Computation time: 7.518130779266357\n",
+      "Step: 140, Loss: 0.0053937858901917934, Computation time: 6.242229223251343\n",
+      "Step: 145, Loss: 0.00430111913010478, Computation time: 5.085596799850464\n",
+      "Step: 150, Loss: 0.004397619515657425, Computation time: 5.2558135986328125\n",
+      "Step: 155, Loss: 0.004206538666039705, Computation time: 7.212834596633911\n"
      ]
     }
    ],

Original file line number	Diff line number	Diff line change
`@@ -102,7 +102,7 @@`
`102`	`102`	`"cell_type": "markdown",`
`103`	`103`	`"metadata": {},`
`104`	`104`	`"source": [`
`105`		`- "In our case we only have 0 since $y\\prime(t=0^{-}) \\neq y\\prime(t=0^{+})$ because $y\\prime(t=0^{+}) = - 2 \\alpha$ and $y\\prime(t=0^{-}) = 0$. \n",`
	`105`	`+ "In our case we only have 0 since $y^\\prime(t=0^{-}) \\neq y^\\prime(t=0^{+})$ because $y^\\prime(t=0^{+}) = - 2 \\alpha$ and $y^\\prime(t=0^{-}) = 0$. \n",`
`106`	`106`	`"We choose $\\tau=1$."`
`107`	`107`	`]`
`108`	`108`	`},`
`@@ -169,7 +169,7 @@`
`169`	`169`	`"name": "stdout",`
`170`	`170`	`"output_type": "stream",`
`171`	`171`	`"text": [`
`172`		`- "Integration took in 0.0011103153228759766 seconds.\n"`
	`172`	`+ "Integration took in 0.0004780292510986328 seconds.\n"`
`173`	`173`	`]`
`174`	`174`	`},`
`175`	`175`	`{`
`@@ -212,7 +212,7 @@`
`212`	`212`	`"name": "stdout",`
`213`	`213`	`"output_type": "stream",`
`214`	`214`	`"text": [`
`215`		`- "Integration took in 0.0009412765502929688 seconds.\n"`
	`215`	`+ "Integration took in 0.0006003379821777344 seconds.\n"`
`216`	`216`	`]`
`217`	`217`	`},`
`218`	`218`	`{`