data:image/s3,"s3://crabby-images/74c42/74c42d6876629e57be375d1154aeedffee5aa998" alt=""
data:image/s3,"s3://crabby-images/bb45e/bb45e6d19df2d4e33d905c5d01d46ea254f20755" alt=""
data:image/s3,"s3://crabby-images/7cca2/7cca22ed805e5842e1d79170e0f4e31c9ac8d775" alt=""
data:image/s3,"s3://crabby-images/2a76d/2a76df950678b32987903d4edc9810d1fa592fb1" alt=""
data:image/s3,"s3://crabby-images/a25b9/a25b9c441ee3489c4a456efa59e3f0689d3a3f90" alt=""
data:image/s3,"s3://crabby-images/4be3f/4be3f8ad5c60e6ab730f05a08ed794b0c54c6add" alt=""
data:image/s3,"s3://crabby-images/84c15/84c15bb867ccc368e1487e2b6a5d9821c5633329" alt=""
data:image/s3,"s3://crabby-images/273a5/273a50f69ebe6ba6ee972c21d1198713ef08d3c1" alt=""
data:image/s3,"s3://crabby-images/e7ed7/e7ed79bf0a87b8e4ad3442a0d84457f168213c8e" alt=""
data:image/s3,"s3://crabby-images/4a302/4a302799d778dbffd11c3fbd4360d175eba2d8b8" alt=""
import numpy;
from pandas import read_csv;
from matplotlib import pyplot as plt;
from sklearn.linear_model import LinearRegression
# Step 1: load the data set. The later steps read its "广告投入" and
# "销售额" columns.
csv_path = 'D:\\PDM\\4.1\\data.csv'
data = read_csv(csv_path)
data:image/s3,"s3://crabby-images/a2d28/a2d28a7b09669bb2989241d3f584b53f2c107107" alt=""
# Step 2: draw a scatter plot of the two columns, then compute the
# correlation coefficients between them.
plt.scatter(data['广告投入'], data['销售额'])
# Left as the final bare expression so the correlation matrix is displayed.
data.corr()
data:image/s3,"s3://crabby-images/91306/91306a1f4d473f126acd95f2da30d0bc25f908da" alt=""
广告投入 销售额
广告投入 1.000000 0.906923
销售额 0.906923 1.000000
# Step 3: estimate the model parameters and build the regression model.
# Double brackets keep x and y as 2-D DataFrames (one column each).
x = data[['广告投入']]
y = data[['销售额']]
# Train the model; fit() returns the estimator itself, so creation and
# training can be chained.
lrModel = LinearRegression().fit(x, y)
# Step 4: check the regression model by scoring it on the training data.
lrModel.score(x, y)
In [4]: lrModel.fit(x, y)
Out[4]: LinearRegression(copy_X=True, fit_intercept=True, n_jobs=1, normalize=False)
In [5]: lrModel.score(x, y)
Out[5]: 0.82250928811669455
# Step 5: use the regression model to predict.
# One inner list per sample, each holding the single input value.
new_inputs = [[50], [40], [30]]
lrModel.predict(new_inputs)
out:array([[ 150.53303965],
[ 113.15418502],
[ 75.7753304 ]])
# Inspect the intercept of the fitted line.
alpha = lrModel.intercept_[0]
# Inspect the coefficient (slope) of the fitted line.
beta = lrModel.coef_[0, 0]
# Recompute the predictions by hand as intercept + slope * input.
inputs = numpy.array([50, 40, 30])
inputs * beta + alpha
array([ 150.53303965, 113.15418502, 75.7753304 ])
网友评论