policy aipw v2

AIgoGracia · AIgoGracia · commit 1a6025b5e8e5 · 2025-09-28T00:10:20.000+09:00
diff --git a/book/cate_and_policy/policy_learning.ipynb b/book/cate_and_policy/policy_learning.ipynb
@@ -39,63 +39,248 @@
    "metadata": {},
    "outputs": [],
    "source": [
-    "# 라이브러리와 난수 고정\n",
     "import numpy as np\n",
     "import matplotlib.pyplot as plt\n",
     "from matplotlib.patches import Rectangle\n",
-    "rng = np.random.default_rng(42)\n",
+    "import matplotlib.patches as mpatches"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Set random seed for reproducibility\n",
+    "np.random.seed(42)\n",
     "\n",
-    "# 데이터 생성\n",
+    "# Generate data\n",
     "n = 1000\n",
     "p = 4\n",
-    "X = rng.random((n, p))                   # 0~1 균등분포 공변량 4개\n",
-    "W = rng.binomial(1, 0.5, size=n)         # 무작위 처치(0/1), 확률 0.5\n",
-    "Y = 0.5*(X[:, 0] - 0.5) + (X[:, 1] - 0.5)*W + 0.1*rng.normal(size=n)\n",
+    "X = np.random.uniform(0, 1, (n, p))\n",
+    "W = np.random.binomial(1, 0.5, n)  # Randomized assignment: independent of X and of the potential outcomes\n",
+    "Y = 0.5 * (X[:, 0] - 0.5) + (X[:, 1] - 0.5) * W + 0.1 * np.random.randn(n)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Normalize Y to [0, 1] and invert it so that larger outcomes are drawn darker by the gray colormap\n",
+    "y_norm = 1 - (Y - Y.min()) / (Y.max() - Y.min())\n",
+    "\n",
+    "# First plot: All data points\n",
+    "fig1, ax1 = plt.subplots(1, 1, figsize=(8, 6))\n",
+    "for i in range(n):\n",
+    "    if W[i] == 1:\n",
+    "        ax1.scatter(X[i, 0], X[i, 1], marker='o', s=100, \n",
+    "                   c=[y_norm[i]], cmap='gray', vmin=0, vmax=1, \n",
+    "                   edgecolors='black', linewidths=1)\n",
+    "    else:\n",
+    "        ax1.scatter(X[i, 0], X[i, 1], marker='D', s=80, \n",
+    "                   c=[y_norm[i]], cmap='gray', vmin=0, vmax=1,\n",
+    "                   edgecolors='black', linewidths=1)\n",
+    "ax1.set_xlabel('X1', fontsize=12)\n",
+    "ax1.set_ylabel('X2', fontsize=12)\n",
+    "ax1.set_title('All Data Points (○: Treated, ◇: Untreated)', fontsize=14)\n",
+    "plt.show()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Second plot: Separated by treatment\n",
+    "fig2, (ax2, ax3) = plt.subplots(1, 2, figsize=(14, 6))\n",
     "\n",
-    "# 시각화\n",
-    "y_norm = 1 - (Y - Y.min())/(Y.max() - Y.min())  # 0~1로 정규화\n",
-    "gray_colors = np.array([str(v) for v in y_norm])\n",
+    "# Untreated group\n",
+    "untreated_idx = W == 0\n",
+    "ax2.scatter(X[untreated_idx, 0], X[untreated_idx, 1], marker='D', s=80, \n",
+    "           c=y_norm[untreated_idx], cmap='gray', vmin=0, vmax=1,\n",
+    "           edgecolors='black', linewidths=1)\n",
+    "ax2.set_xlabel('X1', fontsize=12)\n",
+    "ax2.set_ylabel('X2', fontsize=12)\n",
+    "ax2.set_title('Untreated', fontsize=14)\n",
     "\n",
-    "plt.scatter(X[:, 0], X[:, 1], c=gray_colors, s=60, marker='o',\n",
-    "            edgecolors='k', linewidths=0.5)\n",
+    "# Treated group\n",
+    "treated_idx = W == 1\n",
+    "ax3.scatter(X[treated_idx, 0], X[treated_idx, 1], marker='o', s=100, \n",
+    "           c=y_norm[treated_idx], cmap='gray', vmin=0, vmax=1,\n",
+    "           edgecolors='black', linewidths=1)\n",
+    "ax3.set_xlabel('X1', fontsize=12)\n",
+    "ax3.set_ylabel('X2', fontsize=12)\n",
+    "ax3.set_title('Treated', fontsize=14)\n",
+    "plt.show()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Third plot: Policy regions\n",
+    "fig3, ax4 = plt.subplots(1, 1, figsize=(8, 6))\n",
     "\n",
-    "import matplotlib.pyplot as plt\n",
-    "from matplotlib.patches import Rectangle\n",
+    "# Define colors with transparency\n",
+    "col1 = (0.9960938, 0.7539062, 0.0273438, 0.35)  # Yellow-ish\n",
+    "col2 = (0.250980, 0.690196, 0.650980, 0.35)     # Teal-ish\n",
     "\n",
-    "plt.figure(figsize=(6, 5))\n",
+    "# Draw policy regions\n",
+    "rect1 = Rectangle((-0.1, -0.1), 0.6, 1.2, linewidth=0, \n",
+    "                  edgecolor='none', facecolor=col1, hatch='///')\n",
+    "rect2 = Rectangle((0.5, -0.1), 0.6, 0.6, linewidth=0, \n",
+    "                  edgecolor='none', facecolor=col1, hatch='///')\n",
+    "rect3 = Rectangle((0.5, 0.5), 0.6, 0.6, linewidth=0, \n",
+    "                  edgecolor='none', facecolor=col2, hatch='///')\n",
+    "ax4.add_patch(rect1)\n",
+    "ax4.add_patch(rect2)\n",
+    "ax4.add_patch(rect3)\n",
     "\n",
-    "# 1) 구역 칠하기 (사각형 3개)\n",
-    "col_treat = (0.25, 0.69, 0.65, 0.35)   # 초록 투명\n",
-    "col_notreat = (0.996, 0.754, 0.027, 0.35)  # 노랑 투명\n",
+    "# Plot data points\n",
+    "for i in range(n):\n",
+    "    if W[i] == 1:\n",
+    "        ax4.scatter(X[i, 0], X[i, 1], marker='o', s=100, \n",
+    "                   c=[y_norm[i]], cmap='gray', vmin=0, vmax=1, \n",
+    "                   edgecolors='black', linewidths=1)\n",
+    "    else:\n",
+    "        ax4.scatter(X[i, 0], X[i, 1], marker='D', s=80, \n",
+    "                   c=[y_norm[i]], cmap='gray', vmin=0, vmax=1,\n",
+    "                   edgecolors='black', linewidths=1)\n",
+    "\n",
+    "# Add text labels\n",
+    "ax4.text(0.75, 0.75, 'TREAT (A)', fontsize=16, ha='center', va='center')\n",
+    "ax4.text(0.25, 0.25, 'DO NOT TREAT (A^C)', fontsize=16, ha='left', va='center')\n",
+    "ax4.set_xlabel('X1', fontsize=12)\n",
+    "ax4.set_ylabel('X2', fontsize=12)\n",
+    "ax4.set_xlim(-0.1, 1.1)\n",
+    "ax4.set_ylim(-0.1, 1.1)\n",
+    "ax4.set_title('Policy Regions', fontsize=14)\n",
+    "plt.show()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Policy Evaluation Methods\n",
+    "print(\"=\" * 60)\n",
+    "print(\"POLICY EVALUATION RESULTS\")\n",
+    "print(\"=\" * 60)\n",
     "\n",
-    "# 왼쪽(0~0.5, 전체 y)\n",
-    "plt.gca().add_patch(Rectangle((-.1, -.1), 0.6, 1.2, facecolor=col_notreat, edgecolor='none', hatch='///'))\n",
-    "# 오른쪽 아래(0.5~1, 0~0.5)\n",
-    "plt.gca().add_patch(Rectangle((0.5, -.1), 0.6, 0.6, facecolor=col_notreat, edgecolor='none', hatch='///'))\n",
-    "# 오른쪽 위(0.5~1, 0.5~1)\n",
-    "plt.gca().add_patch(Rectangle((0.5, 0.5), 0.6, 0.6, facecolor=col_treat, edgecolor='none', hatch='///'))\n",
+    "# Method 1: Value of policy A, which treats iff X1 > 0.5 and X2 > 0.5 (only valid in randomized setting)\n",
+    "A = (X[:, 0] > 0.5) & (X[:, 1] > 0.5)\n",
+    "value_estimate = np.mean(Y[A & (W == 1)]) * np.mean(A) + \\\n",
+    "                 np.mean(Y[~A & (W == 0)]) * np.mean(~A)\n",
+    "value_stderr = np.sqrt(\n",
+    "    np.var(Y[A & (W == 1)]) / np.sum(A & (W == 1)) * np.mean(A)**2 + \n",
+    "    np.var(Y[~A & (W == 0)]) / np.sum(~A & (W == 0)) * np.mean(~A)**2\n",
+    ")\n",
+    "print(f\"\\nMethod 1: Value of Policy A\")\n",
+    "print(f\"Value estimate: {value_estimate:.6f}\")\n",
+    "print(f\"Std. Error: {value_stderr:.6f}\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Method 2: Value of a random policy that treats each unit with probability p = 0.75 (only valid in randomized setting)\n",
+    "p_treat = 0.75\n",
+    "value_estimate2 = p_treat * np.mean(Y[W == 1]) + (1 - p_treat) * np.mean(Y[W == 0])\n",
+    "value_stderr2 = np.sqrt(\n",
+    "    np.var(Y[W == 1]) / np.sum(W == 1) * p_treat**2 + \n",
+    "    np.var(Y[W == 0]) / np.sum(W == 0) * (1 - p_treat)**2\n",
+    ")\n",
+    "print(f\"\\nMethod 2: Value of Fixed Treatment Proportion (p={p_treat})\")\n",
+    "print(f\"Value estimate: {value_estimate2:.6f}\")\n",
+    "print(f\"Std. Error: {value_stderr2:.6f}\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Method 3: Value difference between policy A and never treating (treatment effect within A, scaled by the share of units in A)\n",
+    "diff_estimate = (np.mean(Y[A & (W == 1)]) - np.mean(Y[A & (W == 0)])) * np.mean(A)\n",
+    "diff_stderr = np.sqrt(\n",
+    "    np.var(Y[A & (W == 1)]) / np.sum(A & (W == 1)) + \n",
+    "    np.var(Y[A & (W == 0)]) / np.sum(A & (W == 0))\n",
+    ") * np.mean(A)\n",
+    "print(f\"\\nMethod 3: Treatment Effect within Policy Region A\")\n",
+    "print(f\"Difference estimate: {diff_estimate:.6f}\")\n",
+    "print(f\"Std. Error: {diff_stderr:.6f}\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Method 4: Value difference between policy A and a random policy that treats each unit with probability 0.5\n",
+    "diff_estimate2 = (np.mean(Y[A & (W == 1)]) - np.mean(Y[A & (W == 0)])) * np.mean(A) / 2 + \\\n",
+    "                 (np.mean(Y[~A & (W == 0)]) - np.mean(Y[~A & (W == 1)])) * np.mean(~A) / 2\n",
+    "diff_stderr2 = np.sqrt(\n",
+    "    (np.mean(A) / 2)**2 * (\n",
+    "        np.var(Y[A & (W == 1)]) / np.sum(A & (W == 1)) + \n",
+    "        np.var(Y[A & (W == 0)]) / np.sum(A & (W == 0))\n",
+    "    ) + \n",
+    "    (np.mean(~A) / 2)**2 * (\n",
+    "        np.var(Y[~A & (W == 1)]) / np.sum(~A & (W == 1)) + \n",
+    "        np.var(Y[~A & (W == 0)]) / np.sum(~A & (W == 0))\n",
+    "    )\n",
+    ")\n",
+    "print(f\"\\nMethod 4: Optimal Policy Difference\")\n",
+    "print(f\"Difference estimate: {diff_estimate2:.6f}\")\n",
+    "print(f\"Std. Error: {diff_stderr2:.6f}\")\n",
     "\n",
-    "# 2) 점 찍기\n",
-    "plt.scatter(X[W==0,0], X[W==0,1],\n",
-    "            c=y_norm[W==0], cmap='gray', vmin=0, vmax=1,\n",
-    "            s=60, marker='^', edgecolors='k', linewidths=0.5,\n",
-    "            label=\"Untreated\")\n",
-    "plt.scatter(X[W==1,0], X[W==1,1],\n",
-    "            c=y_norm[W==1], cmap='gray', vmin=0, vmax=1,\n",
-    "            s=60, marker='o', edgecolors='k', linewidths=0.5,\n",
-    "            label=\"Treated\")\n",
+    "print(\"\\n\" + \"=\" * 60)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Additional analysis: Treatment effect heterogeneity\n",
+    "print(\"\\nADDITIONAL ANALYSIS\")\n",
+    "print(\"=\" * 60)\n",
     "\n",
-    "# 3) 텍스트 라벨 붙이기\n",
-    "plt.text(0.75, 0.75, \"TREAT (A)\", fontsize=14, ha='center', va='center')\n",
-    "plt.text(0.25, 0.25, \"DO NOT TREAT (A^C)\", fontsize=12, ha='center', va='center')\n",
+    "# Calculate treatment effects by region\n",
+    "te_in_A = np.mean(Y[A & (W == 1)]) - np.mean(Y[A & (W == 0)])\n",
+    "te_out_A = np.mean(Y[~A & (W == 1)]) - np.mean(Y[~A & (W == 0)])\n",
     "\n",
-    "plt.xlim(-0.1, 1.1)\n",
-    "plt.ylim(-0.1, 1.1)\n",
-    "plt.xlabel(\"X1\"); plt.ylabel(\"X2\")\n",
-    "plt.title(\"Policy Regions with Treated vs Untreated\")\n",
-    "plt.legend()\n",
-    "plt.tight_layout()\n",
-    "plt.show()\n"
+    "print(f\"\\nTreatment Effect Heterogeneity:\")\n",
+    "print(f\"Treatment effect in region A: {te_in_A:.6f}\")\n",
+    "print(f\"Treatment effect outside region A: {te_out_A:.6f}\")\n",
+    "print(f\"Difference in treatment effects: {te_in_A - te_out_A:.6f}\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Summary statistics\n",
+    "print(f\"\\nSummary Statistics:\")\n",
+    "print(f\"Proportion in region A: {np.mean(A):.3f}\")\n",
+    "print(f\"Proportion treated: {np.mean(W):.3f}\")\n",
+    "print(f\"Mean outcome (treated): {np.mean(Y[W == 1]):.6f}\")\n",
+    "print(f\"Mean outcome (untreated): {np.mean(Y[W == 0]):.6f}\")\n",
+    "print(f\"Overall treatment effect: {np.mean(Y[W == 1]) - np.mean(Y[W == 0]):.6f}\")"
    ]
   }
  ],