From f5f0f13f5fc5f80e3d131be204bd17e303cb989e Mon Sep 17 00:00:00 2001 From: bingyi Date: Thu, 23 Oct 2025 19:32:48 +0800 Subject: [PATCH] =?UTF-8?q?P250=20=E5=91=BD=E9=A2=981?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- P250 命题1/P250 命题1.md | 203 +++++++++++++++++++++++++++++++++++++++ 1 file changed, 203 insertions(+) create mode 100644 P250 命题1/P250 命题1.md diff --git a/P250 命题1/P250 命题1.md b/P250 命题1/P250 命题1.md new file mode 100644 index 0000000..8ec0c17 --- /dev/null +++ b/P250 命题1/P250 命题1.md @@ -0,0 +1,203 @@ +## 1. 问题设定 + +我们有: +- \( r \):超额收益率向量 (我们想估计的随机向量)(维度 \(N\)) +- \( g \):原始预测向量 (观测到的随机向量)(维度 \(K\)) +- 线性估计形式: + +\[ +\hat{r}(g; b, A) = b + A g +\] +其中 \(b\) 是 \(N\) 维向量,\(A\) 是 \(N \times K\) 矩阵。 + +估计误差: + +\[ +q = r - \hat{r} +\] +均方误差(MSE): + +\[ +\text{MSE}(b,A) = E[q^T q] = E\left[ \sum_{n=1}^N q_n^2 \right] +\] + +--- + +## 2. 第一步:对 \(b\) 优化 + +我们要最小化 \(\text{MSE}(b,A)\),先对 \(b_n\) 求偏导(\(n=1,\dots,N\))。 + +注意: + +\[ +q_n = r_n - b_n - \sum_{k=1}^K A_{n,k} g_k +\] + +\[ +\frac{\partial \text{MSE}}{\partial b_n} = E\left[ 2 q_n \cdot (-1) \right] = -2 E[q_n] \overset{\text{令}}{=} 0 +\] +所以: + +\[ +E[q_n] = 0 +\] +即: + +\[ +E[r_n - b_n - \sum_{k=1}^K A_{n,k} g_k] = 0 +\] + +\[ +E[r_n] - b_n - \sum_{k=1}^K A_{n,k} E[g_k] = 0 +\] +因此: + +\[ +b_n = E[r_n] - \sum_{k=1}^K A_{n,k} E[g_k] +\] +写成向量形式: + +\[ +b = E[r] - A E[g] +\] +于是最优线性估计的形式变为: + +\[ +\hat{r} = E[r] + A (g - E[g]) +\] + + +取期望 + +\[ +E[\hat{r}] = E\big[ E[r] + A (g - E[g]) \big] +\] +由于 \( E[r] \) 是常数,\( A \) 是固定矩阵(不是随机的), + +\[ +E[\hat{r}] = E[r] + A \cdot E[g - E[g]] +\] +而 + +\[ +E[g - E[g]] = E[g] - E[g] = 0 +\] +所以 + +\[ +E[\hat{r}] = E[r] + A \cdot 0 = E[r] +\] + +因此估计是无偏的: + +\[ +E[\hat{r}] = E[r] +\] + +从而 \( E[q] = 0 \): +因为 + +\[ +q = r - \hat{r} +\] + +\[ +E[q] = E[r] - E[\hat{r}] = E[r] - E[r] = 0 +\] + + +--- + +## 3. 引入中心化变量 + +令: + +\[ +s = g - E[g], \quad p = r - E[r] +\] +则: + +\[ +q = p - A s +\] +并且 \(E[q] = 0\)。 + +--- + +## 4. 展开 MSE + + +\[ +\text{MSE}(A) = E[q^T q] = E[(p - A s)^T (p - A s)] +\] + +\[ += E[p^T p] - 2 E[p^T A s] + E[s^T A^T A s] +\] + +--- + +## 5. 对 \(A_{n,k}\) 求偏导 + +我们也可以直接对每个 \(A_{n,k}\) 求偏导来得到条件。 + + +\[ +q_n = p_n - \sum_{j=1}^K A_{n,j} s_j +\] + +\[ +\frac{\partial \text{MSE}}{\partial A_{n,k}} = E\left[ 2 q_n \cdot ( - s_k ) \right] = -2 E[q_n s_k] \overset{\text{令}}{=} 0 +\] +所以: + +\[ +E[q_n s_k] = 0 +\] +即: + +\[ +E\left[ \left( p_n - \sum_{j=1}^K A_{n,j} s_j \right) s_k \right] = 0 +\] + +\[ +E[p_n s_k] - \sum_{j=1}^K A_{n,j} E[s_j s_k] = 0 +\] +注意: +- \(E[p_n s_k] = \text{Cov}(r_n, g_k)\)(因为 \(p_n = r_n - E[r_n]\),\(s_k = g_k - E[g_k]\)) +- \(E[s_j s_k] = \text{Cov}(g_j, g_k)\)(即 \(\text{Var}(g)\) 的第 \((j,k)\) 元素) + +--- + +## 6. 矩阵形式 + +对每个 \(n\),有: + +\[ +\text{Cov}(r_n, g) - A_{n,\cdot} \cdot \text{Var}(g) = 0 +\] +其中 \(A_{n,\cdot}\) 是 \(A\) 的第 \(n\) 行。 + +将所有行堆起来: + +\[ +\text{Cov}(r, g) - A \cdot \text{Var}(g) = 0 +\] +这里 \(\text{Cov}(r,g)\) 是 \(N \times K\) 矩阵,元素为 \(\text{Cov}(r_n, g_k)\)。 + +所以: + +\[ +A = \text{Cov}(r, g) \cdot \text{Var}(g)^{-1} +\] + +--- + +## 7. 最终估计量 + +代入: + +\[ +\hat{r} = E[r] + \text{Cov}(r, g) \cdot \text{Var}(g)^{-1} \cdot (g - E[g]) +\] +这就是命题中给出的形式。