# Required libraries
import pandas as pd
import numpy as np
from sklearn.datasets import load_boston
from sklearn.model_selection import train_test_split
import matplotlib.pyplot as plt
boston = load_boston()
print(boston.data.shape)
print(boston.feature_names)
print(boston.target.shape)
# Creating Pandas dataframe
bos = pd.DataFrame(boston.data)
print(bos.head())
bos['PRICE'] = boston.target
X = bos.drop('PRICE', axis = 1)
Y = bos['PRICE']
Y
# Test and train are two random subsets.Split data into these two subsets.
X_train, X_test, Y_train, Y_test = train_test_split(X, Y, test_size = 0.33, random_state = 5)
print(X_train.shape)
print(X_test.shape)
print(Y_train.shape)
print(Y_test.shape)
# systamization
from sklearn.preprocessing import StandardScaler
std = StandardScaler()
X_train = std.fit_transform(X_train)
X_test = std.fit_transform(X_test)
from sklearn.linear_model import SGDRegressor
from sklearn.metrics import mean_squared_error, r2_score
clf = SGDRegressor()
clf.fit(X_train, Y_train)
Y_pred = clf.predict(X_test)
print("Coefficients: \n", clf.coef_)
print("Y_intercept", clf.intercept_)
IyBSZXF1aXJlZCBsaWJyYXJpZXMKaW1wb3J0IHBhbmRhcyBhcyBwZAppbXBvcnQgbnVtcHkgYXMgbnAKZnJvbSBza2xlYXJuLmRhdGFzZXRzIGltcG9ydCBsb2FkX2Jvc3Rvbgpmcm9tIHNrbGVhcm4ubW9kZWxfc2VsZWN0aW9uIGltcG9ydCB0cmFpbl90ZXN0X3NwbGl0CmltcG9ydCBtYXRwbG90bGliLnB5cGxvdCBhcyBwbHQKYm9zdG9uID0gbG9hZF9ib3N0b24oKQpwcmludChib3N0b24uZGF0YS5zaGFwZSkKcHJpbnQoYm9zdG9uLmZlYXR1cmVfbmFtZXMpCnByaW50KGJvc3Rvbi50YXJnZXQuc2hhcGUpCiMgQ3JlYXRpbmcgUGFuZGFzIGRhdGFmcmFtZQpib3MgPSBwZC5EYXRhRnJhbWUoYm9zdG9uLmRhdGEpCnByaW50KGJvcy5oZWFkKCkpCmJvc1snUFJJQ0UnXSA9IGJvc3Rvbi50YXJnZXQKWCA9IGJvcy5kcm9wKCdQUklDRScsIGF4aXMgPSAxKQpZID0gYm9zWydQUklDRSddClkKIyBUZXN0IGFuZCB0cmFpbiBhcmUgdHdvIHJhbmRvbSBzdWJzZXRzLlNwbGl0IGRhdGEgaW50byB0aGVzZSB0d28gc3Vic2V0cy4KWF90cmFpbiwgWF90ZXN0LCBZX3RyYWluLCBZX3Rlc3QgPSB0cmFpbl90ZXN0X3NwbGl0KFgsIFksIHRlc3Rfc2l6ZSA9IDAuMzMsIHJhbmRvbV9zdGF0ZSA9IDUpCnByaW50KFhfdHJhaW4uc2hhcGUpCnByaW50KFhfdGVzdC5zaGFwZSkKcHJpbnQoWV90cmFpbi5zaGFwZSkKcHJpbnQoWV90ZXN0LnNoYXBlKQojIHN5c3RhbWl6YXRpb24KZnJvbSBza2xlYXJuLnByZXByb2Nlc3NpbmcgaW1wb3J0IFN0YW5kYXJkU2NhbGVyCnN0ZCA9IFN0YW5kYXJkU2NhbGVyKCkKWF90cmFpbiA9IHN0ZC5maXRfdHJhbnNmb3JtKFhfdHJhaW4pClhfdGVzdCA9IHN0ZC5maXRfdHJhbnNmb3JtKFhfdGVzdCkKZnJvbSBza2xlYXJuLmxpbmVhcl9tb2RlbCBpbXBvcnQgU0dEUmVncmVzc29yCmZyb20gc2tsZWFybi5tZXRyaWNzIGltcG9ydCBtZWFuX3NxdWFyZWRfZXJyb3IsIHIyX3Njb3JlCmNsZiA9IFNHRFJlZ3Jlc3NvcigpCmNsZi5maXQoWF90cmFpbiwgWV90cmFpbikKWV9wcmVkID0gY2xmLnByZWRpY3QoWF90ZXN0KQpwcmludCgiQ29lZmZpY2llbnRzOiBcbiIsIGNsZi5jb2VmXykKcHJpbnQoIllfaW50ZXJjZXB0IiwgY2xmLmludGVyY2VwdF8p
(506, 13)
['CRIM' 'ZN' 'INDUS' 'CHAS' 'NOX' 'RM' 'AGE' 'DIS' 'RAD' 'TAX' 'PTRATIO'
'B' 'LSTAT']
(506,)
0 1 2 3 4 ... 8 9 10 11 12
0 0.00632 18.0 2.31 0.0 0.538 ... 1.0 296.0 15.3 396.90 4.98
1 0.02731 0.0 7.07 0.0 0.469 ... 2.0 242.0 17.8 396.90 9.14
2 0.02729 0.0 7.07 0.0 0.469 ... 2.0 242.0 17.8 392.83 4.03
3 0.03237 0.0 2.18 0.0 0.458 ... 3.0 222.0 18.7 394.63 2.94
4 0.06905 0.0 2.18 0.0 0.458 ... 3.0 222.0 18.7 396.90 5.33
[5 rows x 13 columns]
(339, 13)
(167, 13)
(339,)
(167,)
Coefficients:
[-1.20826388 0.71054081 -0.48592306 0.25711637 -1.23634687 2.92020304
-0.41924555 -2.63070839 1.76392467 -1.0457381 -2.0901674 1.02941922
-3.29717613]
Y_intercept [22.53076708]