In [36]:
# Importing the libraries import library
import numpy as np
import matplotlib.pyplot as plt
import pandas as pd
# Enable image adjustment
% matplotlib notebook
#Chinese font display
plt . rc ( 'font' , family = 'SimHei' , size = 8 )
In [3]:
dataset = pd.read_csv('Salary_Data.csv')
dataset
Out[3]:
In [5]:
X = dataset.iloc[:, :-1].values
y = dataset.iloc[:, 1].values
X
Out[5]:
In [6]:
y
Out[6]:
In [28]:
from sklearn.model_selection import train_test_split
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size = 0.3, random_state = 0)
In [29]:
from sklearn.linear_model import LinearRegression
regressor = LinearRegression()
regressor.fit(X_train, y_train)
Out[29]:
In [30]:
y_pred = regressor.predict(X_test)
In [31]:
# Visualising the Training set results
plt.scatter(X_train, y_train, color = 'red') # 训练的点
plt.plot(X_train, regressor.predict(X_train), color = 'blue') # 训练和训练的结果所画的线
plt.title(u'薪水和工作经验(训练集)')
plt.xlabel(u'经验')
plt.ylabel(u'薪水')
plt.show()
In [32]:
plt.scatter(X_test, y_test, color = 'red')# 测试的点
plt.plot(X_train, regressor.predict(X_train), color = 'blue') # 训练和训练的结果所画的线
plt.title(u'薪水和工作经验(测试集)')
plt.xlabel(u'经验')
plt.ylabel(u'薪水')
plt.show()