代码收藏家技术教程 2025-05-12

Python多项式拟合详解与实践

文章目录

Python 多项式拟合

一、Numpy 实现

二、Torch 实现

三、拟合程度

3.1 展示

3.2 过拟合

3.3 欠拟合

Python 多项式拟合

一、Numpy 实现

多项式拟合原理：Python最小二乘法

这里使用第三方库来实现多项式拟合，而不是使用原始的方法：

numpy 库实现：

import numpy as np
import matplotlib.pyplot as plt

# 生成原始数据
# 生成 20 个在 [0, 1) 之间的随机数作为输入特征
x = np.sort(np.random.rand(100))
# 根据正弦函数生成对应的目标值，并添加噪声
y = np.sin(2 * np.pi * x) + 0.3 * np.random.randn(100)

p_is1 = np.poly1d(np.polyfit(x, y, 3))  # 拟合曲线

x_plot = np.linspace(0, 1, 100) 

plt.scatter(x, y, label='Training data', color='blue')
plt.plot(x_plot, p_is1(x_plot), label="predict data")
plt.title('fitting curve')
plt.xlabel('x')
plt.ylabel('y')
plt.legend()

1739436806_zfayb8n4k7.png1739436805904.png

二、Torch 实现

1739448558_dkfblgxycn.png1739448557822.png

import torch
import torch.nn as nn
from torch.utils.data import TensorDataset, DataLoader

# 1. 准备数据
# 生成一些示例数据
n_samples = 100
x1 = torch.randn(n_samples, 1)
x2 = torch.randn(n_samples, 1)
# 真实的权重和偏置
true_w1 = 2.0
true_w2 = 3.0
true_b = 1.0
# 生成标签
y = true_w1 * x1 + true_w2 * x2 + true_b + 0.1 * torch.randn(n_samples, 1)

# 合并特征
X = torch.cat((x1, x2), dim=1)

# 创建数据集和数据加载器
dataset = TensorDataset(X, y)
batch_size = 10
dataloader = DataLoader(dataset, batch_size=batch_size, shuffle=True)

# 2. 定义模型
class LinearRegression(nn.Module):
    def __init__(self):
        super(LinearRegression, self).__init__()
        self.linear = nn.Linear(2, 1)  # 输入维度为 2，输出维度为 1

    def forward(self, x):
        return self.linear(x)

model = LinearRegression()

# 3. 定义损失函数和优化器
criterion = nn.MSELoss()
optimizer = torch.optim.SGD(model.parameters(), lr=0.01)

# 4. 训练模型
num_epochs = 100
for epoch in range(num_epochs):
    for inputs, labels in dataloader:
        # 前向传播
        outputs = model(inputs)
        loss = criterion(outputs, labels)

        # 反向传播和优化
        optimizer.zero_grad()
        loss.backward()
        optimizer.step()

    if (epoch + 1) % 10 == 0:
        print(f'Epoch [{epoch+1}/{num_epochs}], Loss: {loss.item():.4f}')

# 输出最终的权重和偏置
print("Final weights:", model.linear.weight.tolist())
print("Final bias:", model.linear.bias.item())

1739449817_swgyxklg7f.png1739449816827.png

三、拟合程度

3.1 展示

代码：

import numpy as np
import matplotlib.pyplot as plt

# 生成原始数据
# 生成 20 个在 [0, 1) 之间的随机数作为输入特征
x = np.sort(np.random.rand(100))
# 根据正弦函数生成对应的目标值，并添加噪声
y = np.sin(2 * np.pi * x) + 0.3 * np.random.randn(100)

p_over = np.poly1d(np.polyfit(x, y, 15))  # 过饱和曲线
p_under = np.poly1d(np.polyfit(x, y, 1))  # 过饱和曲线
p_is1 = np.poly1d(np.polyfit(x, y, 3))  # 拟合曲线
p_is2 = np.poly1d(np.polyfit(x, y, 4))  # 拟合曲线


# 绘制结果`
plt.figure(figsize=(12, 6))

x_plot = np.linspace(0, 1, 100) 

# 绘制训练集数据和拟合曲线
plt.subplot(2, 2, 1)
plt.scatter(x, y, label='Training data', color='blue')
plt.plot(x_plot, p_over(x_plot), label="predict data")
plt.title('1. Supersaturation fitting curve')
plt.xlabel('x')
plt.ylabel('y')
plt.legend()

# 绘制测试集数据和拟合曲线
plt.subplot(2, 2, 2)
plt.scatter(x, y, label='Training data', color='green')
plt.plot(x_plot, p_under(x_plot), label="predict data")
plt.title('2. Undersaturated fitting curve')
plt.xlabel('x')
plt.ylabel('y')
plt.legend()

# 绘制测试集数据和拟合曲线
plt.subplot(2, 2, 3)
plt.scatter(x, y, label='Training data', color='green')
plt.plot(x_plot, p_is1(x_plot), label="predict data")
plt.title('3. Three order fitting curve')
plt.xlabel('x')
plt.ylabel('y')
plt.legend()

# 绘制测试集数据和拟合曲线
plt.subplot(2, 2, 4)
plt.scatter(x, y, label='Training data', color='green')
plt.plot(x_plot, p_is2(x_plot), label="predict data")
plt.title('4. Four order fitting curve')
plt.xlabel('x')
plt.ylabel('y')
plt.legend()

plt.tight_layout()
plt.show()

1738978302_438sjyc25r.png1738978301378.png