Memory Spaces - Power Iteration - SOLUTION: Fix %timeit synchronization and regenerate output.

brycelelbach · brycelelbach · commit 9265b089fe7c · 2025-08-07T21:04:04.000-07:00
diff --git a/notebooks/5__memory_spaces__power_iteration__SOLUTION.ipynb b/notebooks/5__memory_spaces__power_iteration__SOLUTION.ipynb
@@ -47,7 +47,7 @@
       "metadata": {
         "id": "ZHpg3aVXSeix"
       },
-      "execution_count": null,
+      "execution_count": 1,
       "outputs": []
     },
     {
@@ -78,16 +78,34 @@
       "metadata": {
         "id": "BCToOdVdSONp"
       },
-      "execution_count": null,
+      "execution_count": 2,
       "outputs": []
     },
     {
       "cell_type": "code",
-      "execution_count": null,
+      "execution_count": 3,
       "metadata": {
-        "id": "5ak3mn2hIsKo"
+        "id": "5ak3mn2hIsKo",
+        "outputId": "0d415d45-535a-4a2d-e757-f0c4a7a1efb0",
+        "colab": {
+          "base_uri": "https://localhost:8080/"
+        }
       },
-      "outputs": [],
+      "outputs": [
+        {
+          "output_type": "stream",
+          "name": "stdout",
+          "text": [
+            "[[-0.4937 -0.519  -0.2935 ... -0.1628  0.8361  0.531 ]\n",
+            " [-1.0859  0.0087 -0.0661 ... -0.1706  1.0955  0.7075]\n",
+            " [-0.4291 -0.3628  0.3393 ...  0.1813  0.2238 -0.2124]\n",
+            " ...\n",
+            " [-1.1089 -0.4564 -0.3024 ...  0.2075  1.2864  0.9066]\n",
+            " [-0.8714 -0.5109 -0.1201 ... -0.072   1.3048  0.4372]\n",
+            " [-1.6421 -0.6629 -0.2001 ... -0.2997  1.8579  1.5576]]\n"
+          ]
+        }
+      ],
       "source": [
         "def generate_host(cfg=PowerIterationConfig()):\n",
         "  np.random.seed(42)\n",
@@ -150,10 +168,44 @@
         "print(lam_est_host)"
       ],
       "metadata": {
-        "id": "q0x0_p4pvAdD"
+        "id": "q0x0_p4pvAdD",
+        "outputId": "78e0d606-1d79-4a89-8bcc-79dd9282f4cf",
+        "colab": {
+          "base_uri": "https://localhost:8080/"
+        }
       },
-      "execution_count": null,
-      "outputs": []
+      "execution_count": 4,
+      "outputs": [
+        {
+          "output_type": "stream",
+          "name": "stdout",
+          "text": [
+            "step 0: residual = 7.594e+00\n",
+            "step 10: residual = 1.699e-02\n",
+            "step 20: residual = 2.148e-02\n",
+            "step 30: residual = 1.295e-02\n",
+            "step 40: residual = 4.494e-03\n",
+            "step 50: residual = 1.366e-03\n",
+            "step 60: residual = 4.129e-04\n",
+            "step 70: residual = 1.274e-04\n",
+            "step 80: residual = 4.013e-05\n",
+            "step 90: residual = 1.286e-05\n",
+            "step 100: residual = 4.181e-06\n",
+            "step 110: residual = 1.374e-06\n",
+            "step 120: residual = 4.550e-07\n",
+            "step 130: residual = 1.517e-07\n",
+            "step 140: residual = 5.085e-08\n",
+            "step 150: residual = 1.712e-08\n",
+            "step 160: residual = 5.784e-09\n",
+            "step 170: residual = 1.961e-09\n",
+            "step 180: residual = 6.655e-10\n",
+            "step 190: residual = 2.269e-10\n",
+            "step 200: residual = 7.746e-11\n",
+            "\n",
+            "0.9999999999604734\n"
+          ]
+        }
+      ]
     },
     {
       "cell_type": "markdown",
@@ -204,10 +256,44 @@
         "print(lam_est_device)"
       ],
       "metadata": {
-        "id": "sulx6gabBd1w"
+        "id": "sulx6gabBd1w",
+        "outputId": "2b929e25-6bd7-4533-bf93-1a7d1f912f00",
+        "colab": {
+          "base_uri": "https://localhost:8080/"
+        }
       },
-      "execution_count": null,
-      "outputs": []
+      "execution_count": 5,
+      "outputs": [
+        {
+          "output_type": "stream",
+          "name": "stdout",
+          "text": [
+            "step 0: residual = 7.594e+00\n",
+            "step 10: residual = 1.699e-02\n",
+            "step 20: residual = 2.148e-02\n",
+            "step 30: residual = 1.295e-02\n",
+            "step 40: residual = 4.494e-03\n",
+            "step 50: residual = 1.366e-03\n",
+            "step 60: residual = 4.129e-04\n",
+            "step 70: residual = 1.274e-04\n",
+            "step 80: residual = 4.013e-05\n",
+            "step 90: residual = 1.286e-05\n",
+            "step 100: residual = 4.181e-06\n",
+            "step 110: residual = 1.374e-06\n",
+            "step 120: residual = 4.550e-07\n",
+            "step 130: residual = 1.517e-07\n",
+            "step 140: residual = 5.085e-08\n",
+            "step 150: residual = 1.712e-08\n",
+            "step 160: residual = 5.784e-09\n",
+            "step 170: residual = 1.960e-09\n",
+            "step 180: residual = 6.659e-10\n",
+            "step 190: residual = 2.269e-10\n",
+            "step 200: residual = 7.736e-11\n",
+            "\n",
+            "0.9999999999593268\n"
+          ]
+        }
+      ]
     },
     {
       "cell_type": "markdown",
@@ -257,10 +343,63 @@
         "print(lam_est_device_generation)"
       ],
       "metadata": {
-        "id": "HXFZXGhU1Xj2"
+        "id": "HXFZXGhU1Xj2",
+        "outputId": "fd52bba4-839b-42c6-c7d3-80d1a39f80e3",
+        "colab": {
+          "base_uri": "https://localhost:8080/"
+        }
       },
-      "execution_count": null,
-      "outputs": []
+      "execution_count": 6,
+      "outputs": [
+        {
+          "output_type": "stream",
+          "name": "stdout",
+          "text": [
+            "A_host:\n",
+            "[[-0.4937 -0.519  -0.2935 ... -0.1628  0.8361  0.531 ]\n",
+            " [-1.0859  0.0087 -0.0661 ... -0.1706  1.0955  0.7075]\n",
+            " [-0.4291 -0.3628  0.3393 ...  0.1813  0.2238 -0.2124]\n",
+            " ...\n",
+            " [-1.1089 -0.4564 -0.3024 ...  0.2075  1.2864  0.9066]\n",
+            " [-0.8714 -0.5109 -0.1201 ... -0.072   1.3048  0.4372]\n",
+            " [-1.6421 -0.6629 -0.2001 ... -0.2997  1.8579  1.5576]]\n",
+            "\n",
+            "A_device:\n",
+            "[[-0.3175 -0.227   0.0765 ... -0.2411  0.9861 -0.6663]\n",
+            " [-1.8135 -0.6378 -0.4466 ... -0.4503  3.2291 -1.3058]\n",
+            " [-0.6443  0.3033  0.9719 ...  0.1302  0.4531 -0.3723]\n",
+            " ...\n",
+            " [-1.8697 -0.7714 -0.2048 ...  0.0244  2.859  -1.1147]\n",
+            " [-1.1404 -0.9935 -0.4077 ... -0.2789  2.8553 -0.7879]\n",
+            " [-0.5979 -0.6596  0.1047 ... -0.1826  1.4195 -0.0636]]\n",
+            "\n",
+            "step 0: residual = 2.346e+01\n",
+            "step 10: residual = 2.859e-02\n",
+            "step 20: residual = 2.984e-02\n",
+            "step 30: residual = 1.433e-02\n",
+            "step 40: residual = 5.035e-03\n",
+            "step 50: residual = 1.643e-03\n",
+            "step 60: residual = 5.309e-04\n",
+            "step 70: residual = 1.726e-04\n",
+            "step 80: residual = 5.663e-05\n",
+            "step 90: residual = 1.875e-05\n",
+            "step 100: residual = 6.253e-06\n",
+            "step 110: residual = 2.098e-06\n",
+            "step 120: residual = 7.077e-07\n",
+            "step 130: residual = 2.396e-07\n",
+            "step 140: residual = 8.140e-08\n",
+            "step 150: residual = 2.772e-08\n",
+            "step 160: residual = 9.461e-09\n",
+            "step 170: residual = 3.234e-09\n",
+            "step 180: residual = 1.107e-09\n",
+            "step 190: residual = 3.792e-10\n",
+            "step 200: residual = 1.299e-10\n",
+            "step 210: residual = 4.454e-11\n",
+            "\n",
+            "0.9999999999558278\n"
+          ]
+        }
+      ]
     },
     {
       "cell_type": "markdown",
@@ -282,7 +421,7 @@
       "metadata": {
         "id": "fL7QYIVesehd"
       },
-      "execution_count": null,
+      "execution_count": 7,
       "outputs": []
     },
     {
@@ -313,10 +452,29 @@
         "np.testing.assert_allclose(lam_est_device, lam_ref, rtol=1e-4)"
       ],
       "metadata": {
-        "id": "7E7MUYsYsjwO"
+        "id": "7E7MUYsYsjwO",
+        "outputId": "b9e3bb4e-f9d9-4311-ba18-5896be23eb8e",
+        "colab": {
+          "base_uri": "https://localhost:8080/"
+        }
       },
-      "execution_count": null,
-      "outputs": []
+      "execution_count": 8,
+      "outputs": [
+        {
+          "output_type": "stream",
+          "name": "stdout",
+          "text": [
+            "Solution\n",
+            "\n",
+            "Power iteration (host)   = 1.000000e+00\n",
+            "Power iteration (device) = 1.000000e+00\n",
+            "`eigvals` reference      = 1.000000e+00\n",
+            "\n",
+            "Relative error (host)    = 3.938e-11\n",
+            "Relative error (device)  = 4.053e-11\n"
+          ]
+        }
+      ]
     },
     {
       "cell_type": "markdown",
@@ -333,22 +491,38 @@
         "print(f\"Execution Time\")\n",
         "print()\n",
         "\n",
-        "time_host = %timeit -q -o estimate_host(A_host, PowerIterationConfig(progress=False))\n",
+        "time_host = %timeit -q -o estimate_host(A_host, PowerIterationConfig(progress=False)).item()\n",
         "print(f\"Power iteration (host)   = {time_host}\")\n",
         "\n",
         "# We intentionally use `A_host`, not `A_device`, because they're not\n",
         "# the same matrices due to differences in NumPy and CuPy's random facilities.\n",
-        "time_device = %timeit -q -o estimate_device(A_host, PowerIterationConfig(progress=False))\n",
+        "time_device = %timeit -q -o estimate_device(A_host, PowerIterationConfig(progress=False)).item()\n",
         "print(f\"Power iteration (device) = {time_device}\")\n",
         "\n",
         "time_ref = %timeit -q -o -r 1 -n 1 np.linalg.eigvals(A_host).real.max()\n",
         "print(f\"`eigvals` reference      = {time_ref}\")"
       ],
       "metadata": {
-        "id": "v_2HmcBFERhE"
+        "id": "v_2HmcBFERhE",
+        "outputId": "43c4da5f-6164-4088-ac5e-685f26b58c95",
+        "colab": {
+          "base_uri": "https://localhost:8080/"
+        }
       },
-      "execution_count": null,
-      "outputs": []
+      "execution_count": 9,
+      "outputs": [
+        {
+          "output_type": "stream",
+          "name": "stdout",
+          "text": [
+            "Execution Time\n",
+            "\n",
+            "Power iteration (host)   = 2.38 s ± 382 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)\n",
+            "Power iteration (device) = 324 ms ± 7.39 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)\n",
+            "`eigvals` reference      = 49.1 s ± 0 ns per loop (mean ± std. dev. of 1 run, 1 loop each)\n"
+          ]
+        }
+      ]
     }
   ]
-}
+}