1. # coding=utf-8
    2. from sklearn.model_selection import train_test_split # 这里是引用了交叉验证
    3. from sklearn.linear_model import LinearRegression # 线性回归
    4. import numpy as np
    5. from data_load import load_data
    6. X,y = load_data()
    7. # 训练数据
    8. X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2)
    9. lin_reg = LinearRegression()
    10. for i in range(2):
    11. lin_reg.fit(X_train, y_train)
    12. feature_cols = ['so2', 'PM10', '悬挂高度', '电压等级']
    13. B = list(zip(feature_cols, lin_reg.coef_))
    14. print("系数 ", B)
    15. # 预测
    16. y_pred = lin_reg.predict(X_test)