# 【PyTorch】多项式回归

## 1. 模型与代码实现

### 1.1. 模型

• 将多项式特征值预处理为线性模型的特征值。即

$$y = w_0 + w_1 x + w_2 x^2 + \dots + w_n x^n$$

变换为

$$y = w_0 + w_1 z_1 + w_2 z_2 + \dots + w_n z_n$$

其中 $z_i = x^i$。

• 为了避免指数值过大，可以将 $x^i$ 调整为 $\frac{x^i}{i!}$，即

$$y = w_0 + w_1\frac{x}{1!} + w_2\frac{x^2}{2!} + \dots + w_n\frac{x^n}{n!}$$

### 1.2. 代码实现

#### 1.2.1. 完整代码

import os
import numpy as np
import math, torch
from d2l import torch as d2l
import torch.nn as nn
from tensorboardX import SummaryWriter
from rich.progress import track

"""评估给定数据集上模型的损失"""
# NOTE(review): this is the body of a loss-evaluation helper whose `def` line and
# whose loop producing X, y are not present in this listing — TODO restore them
# from the original script before running.
metric.reset()
# Move the current batch to the target device before the forward pass.
X, y = X.to(device, non_blocking=True), y.to(device, non_blocking=True)
loss = criterion(net(X), y)
# NOTE(review): no visible line adds `loss` to `metric`; presumably a
# `metric.add(...)` call was lost — confirm against the original.
# Presumably metric[0] is the summed loss and metric[1] the sample count, so this
# is the mean loss per sample — verify against where the accumulator is filled.
return metric[0] / metric[1]

"""加载数据集"""
# NOTE(review): this is the body of a data-loading helper whose `def` line is not
# present in this listing — TODO restore it from the original script.
# NOTE(review): `TensorDataset` is not among the imports visible in this file;
# presumably it comes from torch.utils.data — confirm and import it.
dataset = TensorDataset(*data_arrays)
# NOTE(review): the line below is the tail of a call whose opening (presumably a
# DataLoader construction) is missing from this listing — TODO restore.
num_workers=num_workers, prefetch_factor=prefetch_factor)

# NOTE(review): everything below belongs to the body of this guard, but the
# indentation has been lost in this listing — re-indent before running.
if __name__ == '__main__':
# Global hyper-parameters
learning_rate = 0.01
# Use the GPU when one is available, otherwise fall back to the CPU.
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
num_epochs = 400
batch_size = 10
num_workers = 0
# NOTE(review): if these two values are forwarded to torch's DataLoader, recent
# PyTorch versions reject a non-None prefetch_factor when num_workers == 0 —
# confirm against the installed version.
prefetch_factor = 2

max_degree = 20             # highest polynomial degree used to generate the features
model_degree = 1           # degree of the polynomial the model is allowed to fit
n_train, n_test = 100, 100  # sizes of the training and test sets

# Ground-truth coefficients: only the first four (degrees 0..3) are non-zero,
# all higher-degree coefficients stay at zero.
true_w = np.zeros(max_degree+1)
true_w[0:4] = np.array([5, 1.2, -3.4, 5.6])

# 创建记录器
def get_logdir(root='runs'):
    """Return the path of an unused experiment directory under ``root``.

    ``root`` is created if it does not exist yet. The candidate name is
    ``exp<k>`` where ``k`` starts at the number of entries in ``root`` plus
    one and is advanced until no entry with that name exists. The experiment
    directory itself is not created here.

    Args:
        root: Directory that holds one sub-directory per run.

    Returns:
        The path ``'<root>/exp<k>'`` as a string.
    """
    # exist_ok avoids the check-then-create race of os.path.exists + os.mkdir.
    os.makedirs(root, exist_ok=True)
    order = len(os.listdir(root)) + 1
    # After an earlier run directory has been deleted, the count-based name can
    # already be taken; skip ahead so two runs never share one log directory.
    while os.path.exists(f'{root}/exp{order}'):
        order += 1
    return f'{root}/exp{order}'
# Open a TensorBoard writer on the directory chosen by get_logdir().
writer = SummaryWriter(get_logdir())

# Generate the synthetic dataset
# One scalar input x per sample, drawn from a standard normal; shape (n_train + n_test, 1).
features = np.random.normal(size=(n_train + n_test, 1))
# NOTE(review): the samples are already i.i.d., so this shuffle looks redundant — confirm.
np.random.shuffle(features)
# Broadcast x against the exponents 0..max_degree: column i holds x**i,
# giving shape (n_train + n_test, max_degree + 1).
poly_features = np.power(features, np.arange(max_degree+1).reshape(1, -1))
# NOTE(review): the loop body below has lost its indentation in this listing.
for i in range(max_degree+1):
poly_features[:, i] /= math.gamma(i + 1)  # gamma(i + 1) = i!, so column i becomes x**i / i!
# Labels are the linear combination of the scaled features with the true coefficients.
labels = np.dot(poly_features, true_w)
labels += np.random.normal(scale=0.1, size=labels.shape)    # add Gaussian noise with std 0.1, i.e. N(0, 0.01)

# Convert both NumPy arrays to float32 tensors.
poly_features, labels = [
torch.as_tensor(x, dtype=torch.float32) for x in [
poly_features, labels]]

# Build the model
# A single linear layer over the first model_degree + 1 feature columns. No bias
# is used because column 0 is x**0 = 1, so its weight acts as the intercept w_0.
net = nn.Sequential(nn.Linear(model_degree+1, 1, bias=False)).to(device, non_blocking=True)
def init_weights(m):
    """Initialise the weight of a linear layer from a normal distribution.

    Modules that are not linear layers are left untouched, so the function
    can be applied to every sub-module of a network.

    Args:
        m: The module to initialise.
    """
    # isinstance (rather than an exact type comparison) also covers
    # subclasses of nn.Linear.
    if isinstance(m, nn.Linear):
        nn.init.normal_(m.weight, mean=0, std=0.01)
# Run init_weights on every sub-module of the network.
net.apply(init_weights)
# reduction='none' keeps the per-element losses; the training step below
# reduces them with .mean() before calling backward().
criterion = nn.MSELoss(reduction='none')
optimizer = torch.optim.SGD(net.parameters(), lr=learning_rate)

# Split the dataset
# The first n_train rows are the training set, the rest the test set. Only the
# first model_degree + 1 feature columns are given to the model, and the labels
# are reshaped into a column to match the network output.
features_train, labels_train = poly_features[:n_train, :model_degree+1], labels[:n_train].reshape(-1, 1)
features_test, labels_test = poly_features[n_train:, :model_degree+1], labels[n_train:].reshape(-1, 1)

# Training loop
metric = d2l.Accumulator(2)  # sum of losses, number of samples
# NOTE(review): the loop body has lost its indentation, and the inner loop that
# yields the batches X, y is not present in this listing — TODO restore it.
for epoch in track(range(num_epochs)):
X, y = X.to(device, non_blocking=True), y.to(device, non_blocking=True)
loss = criterion(net(X), y)
# NOTE(review): no optimizer.zero_grad() is visible before backward(); unless
# it was lost with the missing lines, gradients accumulate across steps — confirm.
loss.mean().backward()
optimizer.step()

# NOTE(review): the line below is the tail of a call whose opening is missing;
# presumably a writer.add_scalars(...) logging the losses per epoch — TODO restore.
}, epoch)
# Print the learned coefficients of the single linear layer.
print("weights =", net[0].weight.data.cpu().numpy())

writer.close()


#### 1.2.2. 输出结果

• 采用1阶多项式（线性模型）拟合：

• 采用3阶多项式拟合

• 采用20阶多项式拟合

