
Commit 5bab20e

Fixes for investment lecture (#122)
* misc * misc * misc * misc * misc
1 parent 9445f8d commit 5bab20e

File tree: lectures/opt_invest.md, lectures/opt_savings.md

2 files changed: +62 additions, −77 deletions

lectures/opt_invest.md

Lines changed: 27 additions & 42 deletions
@@ -25,8 +25,7 @@ We require the following library to be installed.
 !pip install --upgrade quantecon
 ```
 
-A monopolist faces inverse demand
-curve
+We study a monopolist who faces the inverse demand curve
 
 $$
 P_t = a_0 - a_1 Y_t + Z_t,
@@ -38,7 +37,7 @@ where
 * $Y_t$ is output and
 * $Z_t$ is a demand shock.
 
-We assume that $Z_t$ is a discretized AR(1) process.
+We assume that $Z_t$ is a discretized AR(1) process, specified below.
 
 Current profits are
 
@@ -116,10 +115,10 @@ def create_investment_model(
 
 
 Let's re-write the vectorized version of the right-hand side of the
-Bellman equation (before maximization), which is a 3D array representing:
+Bellman equation (before maximization), which is a 3D array representing
 
 $$
-B(y, z, y') = r(y, z, y') + \beta \sum_{z'} v(y', z') Q(z, z')
+B(y, z, y') = r(y, z, y') + \beta \sum_{z'} v(y', z') Q(z, z')
 $$
 
 for all $(y, z, y')$.
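Aside: the broadcasting pattern behind such a 3D array can be sketched in a few lines of JAX. The sizes and stand-in arrays below are assumptions for illustration, not the lecture's `B` (which unpacks `constants`, `sizes` and `arrays`):

```python
import jax.numpy as jnp

# Toy sizes and stand-in arrays (assumptions, not the lecture's model)
y_size, z_size, β = 5, 4, 0.95
r = jnp.zeros((y_size, z_size, y_size))     # r[i, j, ip] plays r(y, z, y')
v = jnp.ones((y_size, z_size))              # v[ip, jp]   plays v(y', z')
Q = jnp.full((z_size, z_size), 1 / z_size)  # Q[j, jp]    plays Q(z, z')

# EV[j, ip] = Σ_jp Q[j, jp] v[ip, jp], i.e. Σ_{z'} v(y', z') Q(z, z')
EV = Q @ v.T

# Broadcast EV over the y axis: B[i, j, ip] = r[i, j, ip] + β EV[j, ip]
B = r + β * EV[None, :, :]
print(B.shape)   # (y_size, z_size, y_size)
```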
@@ -154,8 +153,10 @@ def B(v, constants, sizes, arrays):
 B = jax.jit(B, static_argnums=(2,))
 ```
 
+We define a function to compute the current rewards $r_\sigma$ given policy $\sigma$,
+which is defined as the vector
 
-Define a function to compute the current rewards given policy $\sigma$.
+$$ r_\sigma(y, z) := r(y, z, \sigma(y, z)) $$
 
 ```{code-cell} ipython3
 def compute_r_σ(σ, constants, sizes, arrays):
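Aside: one way to picture the extraction $r_\sigma(y, z) = r(y, z, \sigma(y, z))$ is fancy indexing over a precomputed reward array; the lecture's `compute_r_σ` may instead build rewards directly from model primitives, so treat the shapes and names here as hypothetical:

```python
import jax.numpy as jnp

# Hypothetical full reward array r[i, j, ip] and a policy σ[i, j]
# holding indices into the y grid (illustration only)
y_size, z_size = 5, 4
r = jnp.arange(y_size * z_size * y_size, dtype=jnp.float32)
r = r.reshape(y_size, z_size, y_size)
σ = jnp.zeros((y_size, z_size), dtype=jnp.int32)

# r_σ[i, j] = r[i, j, σ[i, j]] via broadcasting index arrays
i = jnp.arange(y_size)[:, None]   # shape (y_size, 1)
j = jnp.arange(z_size)[None, :]   # shape (1, z_size)
r_σ = r[i, j, σ]                  # shape (y_size, z_size)
```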
@@ -238,47 +239,32 @@ T_σ = jax.jit(T_σ, static_argnums=(3,))
 
 Next, we want to compute the lifetime value of following policy $\sigma$.
 
-The basic problem is to solve the linear system
+This lifetime value is a function $v_\sigma$ that satisfies
 
-$$ v(y, z) = r(y, z, \sigma(y, z)) + \beta \sum_{z'} v(\sigma(y, z), z') Q(z, z) $$
+$$ v_\sigma(y, z) = r_\sigma(y, z) + \beta \sum_{z'} v_\sigma(\sigma(y, z), z') Q(z, z') $$
 
-for $v$.
+We wish to solve this equation for $v_\sigma$.
 
-It turns out to be helpful to rewrite this as
+Suppose we define the linear operator $L_\sigma$ by
 
-$$ v(y, z) = r(y, z, \sigma(y, z)) + \beta \sum_{y', z'} v(y', z') P_\sigma(y, z, y', z') $$
+$$ (L_\sigma v)(y, z) = v(y, z) - \beta \sum_{z'} v(\sigma(y, z), z') Q(z, z') $$
 
-where $P_\sigma(y, z, y', z') = 1\{y' = \sigma(y, z)\} Q(z, z')$.
-
-We want to write this as $v = r_\sigma + \beta P_\sigma v$ and then solve for $v$
-
-Note, however, that $v$ is a multi-index array, rather than a vector.
-
-
-The value $v_{\sigma}$ of a policy $\sigma$ is defined as
+With this notation, the problem is to solve for $v$ via
 
 $$
-v_{\sigma} = (I - \beta P_{\sigma})^{-1} r_{\sigma}
+(L_{\sigma} v)(y, z) = r_\sigma(y, z)
 $$
 
-Here we set up the linear map $v \mapsto R_{\sigma} v$,
-
-where $R_{\sigma} := I - \beta P_{\sigma}$
-
-In the investment problem, this map can be expressed as
-
-$$
-(R_{\sigma} v)(y, z) = v(y, z) - \beta \sum_{z'} v(\sigma(y, z), z') Q(z, z')
-$$
+In vector form this is $L_\sigma v = r_\sigma$, which tells us that the function
+we seek is
 
-Defining the map as above works in a more intuitive multi-index setting
-(e.g. working with $v[i, j]$ rather than flattening v to a one-dimensional
-array) and avoids instantiating the large matrix $P_{\sigma}$.
+$$ v_\sigma = L_\sigma^{-1} r_\sigma $$
 
-Let's define the function $R_{\sigma}$.
+JAX allows us to solve linear systems defined in terms of operators; the first
+step is to define the function $L_{\sigma}$.
 
 ```{code-cell} ipython3
-def R_σ(v, σ, constants, sizes, arrays):
+def L_σ(v, σ, constants, sizes, arrays):
 
     β, a_0, a_1, γ, c = constants
     y_size, z_size = sizes
@@ -296,12 +282,11 @@ def R_σ(v, σ, constants, sizes, arrays):
     # Compute and return v[i, j] - β Σ_jp v[σ[i, j], jp] * Q[j, jp]
     return v - β * jnp.sum(V * Q, axis=2)
 
-R_σ = jax.jit(R_σ, static_argnums=(3,))
+L_σ = jax.jit(L_σ, static_argnums=(3,))
 ```
 
+Now we can define a function to compute $v_{\sigma}$.
 
-Define a function to get the value $v_{\sigma}$ of policy
-$\sigma$ by inverting the linear map $R_{\sigma}$.
 
 ```{code-cell} ipython3
 def get_value(σ, constants, sizes, arrays):
@@ -313,16 +298,16 @@ def get_value(σ, constants, sizes, arrays):
 
     r_σ = compute_r_σ(σ, constants, sizes, arrays)
 
-    # Reduce R_σ to a function in v
-    partial_R_σ = lambda v: R_σ(v, σ, constants, sizes, arrays)
+    # Reduce L_σ to a function in v
+    partial_L_σ = lambda v: L_σ(v, σ, constants, sizes, arrays)
 
-    return jax.scipy.sparse.linalg.bicgstab(partial_R_σ, r_σ)[0]
+    return jax.scipy.sparse.linalg.bicgstab(partial_L_σ, r_σ)[0]
 
 get_value = jax.jit(get_value, static_argnums=(2,))
 ```
 
 
-Now we define the solvers, which implement VFI, HPI and OPI.
+Finally, we introduce the solvers that implement VFI, HPI and OPI.
 
 ```{code-cell} ipython3
 :load: _static/lecture_specific/vfi.py
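Aside: the matrix-free solve in the hunk above relies on `jax.scipy.sparse.linalg.bicgstab` accepting a function in place of a matrix, so $L_\sigma$ is never instantiated as a matrix. A self-contained toy sketch, with random stand-ins replacing the lecture's model:

```python
import jax
import jax.numpy as jnp

# Toy dimensions and stand-in data (assumptions for illustration)
y_size, z_size, β = 5, 4, 0.9
k1, k2, k3 = jax.random.split(jax.random.PRNGKey(0), 3)
Q = jax.random.uniform(k1, (z_size, z_size))
Q = Q / Q.sum(axis=1, keepdims=True)    # make each row sum to one
σ = jax.random.randint(k2, (y_size, z_size), 0, y_size)
r_σ = jax.random.uniform(k3, (y_size, z_size))

def L_σ(v):
    # W[i, j, jp] = v[σ[i, j], jp], so summing W * Q over axis 2
    # gives Σ_jp v[σ[i, j], jp] Q[j, jp]
    W = v[σ]
    return v - β * jnp.sum(W * Q, axis=2)

# bicgstab takes the linear map itself; v_σ keeps its 2D shape throughout
v_σ, _ = jax.scipy.sparse.linalg.bicgstab(L_σ, r_σ)
print(jnp.max(jnp.abs(L_σ(v_σ) - r_σ)))   # residual should be near zero
```

Because the rows of `Q` sum to one and $\beta < 1$, the operator $I - \beta P_\sigma$ is invertible and well conditioned, so `bicgstab` converges quickly.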
@@ -396,7 +381,7 @@ plt.show()
 Let's plot the time taken by each of the solvers and compare them.
 
 ```{code-cell} ipython3
-m_vals = range(5, 3000, 100)
+m_vals = range(5, 600, 40)
 ```
 
 ```{code-cell} ipython3

lectures/opt_savings.md

Lines changed: 35 additions & 35 deletions
@@ -133,7 +133,14 @@ def B(v, constants, sizes, arrays):
 
 ## Operators
 
-Now we define the policy operator $T_\sigma$
+
+We define a function to compute the current rewards $r_\sigma$ given policy $\sigma$,
+which is defined as the vector
+
+$$ r_\sigma(w, y) := r(w, y, \sigma(w, y)) $$
+
+
+
 
 ```{code-cell} ipython3
 def compute_r_σ(σ, constants, sizes, arrays):
157164
return r_σ
158165
```
159166

167+
Now we define the policy operator $T_\sigma$
168+
160169
```{code-cell} ipython3
161170
def T_σ(v, σ, constants, sizes, arrays):
162171
"The σ-policy operator."
@@ -201,47 +210,36 @@ def get_greedy(v, constants, sizes, arrays):
 
 The function below computes the value $v_\sigma$ of following policy $\sigma$.
 
-The basic problem is to solve the linear system
-
-$$ v(w,y ) = u(Rw + y - \sigma(w, y)) + β \sum_{y'} v(\sigma(w, y), y') Q(y, y) $$
+This lifetime value is a function $v_\sigma$ that satisfies
 
-for $v$.
+$$ v_\sigma(w, y) = r_\sigma(w, y) + \beta \sum_{y'} v_\sigma(\sigma(w, y), y') Q(y, y') $$
 
-It turns out to be helpful to rewrite this as
+We wish to solve this equation for $v_\sigma$.
 
-$$ v(w,y) = r(w, y, \sigma(w, y)) + β \sum_{w', y'} v(w', y') P_\sigma(w, y, w', y') $$
+Suppose we define the linear operator $L_\sigma$ by
 
-where $P_\sigma(w, y, w', y') = 1\{w' = \sigma(w, y)\} Q(y, y')$.
+$$ (L_\sigma v)(w, y) = v(w, y) - \beta \sum_{y'} v(\sigma(w, y), y') Q(y, y') $$
 
-We want to write this as $v = r_\sigma + P_\sigma v$ and then solve for $v$
+With this notation, the problem is to solve for $v$ via
 
-Note, however,
+$$
+(L_{\sigma} v)(w, y) = r_\sigma(w, y)
+$$
 
-* $v$ is a 2 index array, rather than a single vector.
-* $P_\sigma$ has four indices rather than 2
+In vector form this is $L_\sigma v = r_\sigma$, which tells us that the function
+we seek is
 
-The code below
+$$ v_\sigma = L_\sigma^{-1} r_\sigma $$
 
-1. reshapes $v$ and $r_\sigma$ to 1D arrays and $P_\sigma$ to a matrix
-2. solves the linear system
-3. converts back to multi-index arrays.
+JAX allows us to solve linear systems defined in terms of operators; the first
+step is to define the function $L_{\sigma}$.
 
 ```{code-cell} ipython3
-def R_σ(v, σ, constants, sizes, arrays):
+def L_σ(v, σ, constants, sizes, arrays):
     """
-    The value v_σ of a policy σ is defined as
-
-        v_σ = (I - β P_σ)^{-1} r_σ
-
-    Here we set up the linear map v -> R_σ v, where R_σ := I - β P_σ.
+    Here we set up the linear map v -> L_σ v, where
 
-    In the consumption problem, this map can be expressed as
-
-        (R_σ v)(w, y) = v(w, y) - β Σ_y′ v(σ(w, y), y′) Q(y, y′)
-
-    Defining the map as above works in a more intuitive multi-index setting
-    (e.g. working with v[i, j] rather than flattening v to a one-dimensional
-    array) and avoids instantiating the large matrix P_σ.
+        (L_σ v)(w, y) = v(w, y) - β Σ_y′ v(σ(w, y), y′) Q(y, y′)
 
     """
@@ -262,9 +260,11 @@ def R_σ(v, σ, constants, sizes, arrays):
     return v - β * jnp.sum(V * Q, axis=2)
 ```
 
+Now we can define a function to compute $v_{\sigma}$.
+
 ```{code-cell} ipython3
 def get_value(σ, constants, sizes, arrays):
-    "Get the value v_σ of policy σ by inverting the linear map R_σ."
+    "Get the value v_σ of policy σ by inverting the linear map L_σ."
 
     # Unpack
     β, R, γ = constants
@@ -273,10 +273,10 @@ def get_value(σ, constants, sizes, arrays):
 
     r_σ = compute_r_σ(σ, constants, sizes, arrays)
 
-    # Reduce R_σ to a function in v
-    partial_R_σ = lambda v: R_σ(v, σ, constants, sizes, arrays)
+    # Reduce L_σ to a function in v
+    partial_L_σ = lambda v: L_σ(v, σ, constants, sizes, arrays)
 
-    return jax.scipy.sparse.linalg.bicgstab(partial_R_σ, r_σ)[0]
+    return jax.scipy.sparse.linalg.bicgstab(partial_L_σ, r_σ)[0]
 ```
 
 ## JIT compiled versions
@@ -288,7 +288,7 @@ T = jax.jit(T, static_argnums=(2,))
 get_greedy = jax.jit(get_greedy, static_argnums=(2,))
 get_value = jax.jit(get_value, static_argnums=(2,))
 T_σ = jax.jit(T_σ, static_argnums=(3,))
-R_σ = jax.jit(R_σ, static_argnums=(3,))
+L_σ = jax.jit(L_σ, static_argnums=(3,))
 ```
 
 ## Solvers
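Aside: with the jitted functions in scope, one natural sanity check is that the solution returned by `get_value` satisfies the defining identity $L_\sigma v_\sigma = r_\sigma$ up to solver tolerance. This usage sketch assumes `σ`, `constants`, `sizes` and `arrays` are unpacked from the model as in the lecture:

```python
import jax.numpy as jnp

# Assumes compute_r_σ, get_value, L_σ and a policy σ from the lecture
r_σ = compute_r_σ(σ, constants, sizes, arrays)
v_σ = get_value(σ, constants, sizes, arrays)
residual = jnp.max(jnp.abs(L_σ(v_σ, σ, constants, sizes, arrays) - r_σ))
print(residual)   # should be close to zero (bicgstab tolerance)
```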
@@ -379,7 +379,7 @@ model = create_consumption_model()
 σ_pi, pi_time = run_algorithm(policy_iteration, model)
 σ_vfi, vfi_time = run_algorithm(value_iteration, model, tol=1e-5)
 
-m_vals = range(5, 3000, 100)
+m_vals = range(5, 600, 40)
 opi_times = []
 for m in m_vals:
     σ_opi, opi_time = run_algorithm(optimistic_policy_iteration, model, m=m, tol=1e-5)
