Skip to content

Instantly share code, notes, and snippets.

@amankharwal
Created June 22, 2021 11:42
Show Gist options
  • Save amankharwal/6507de8d60739ad5da661038562b88c4 to your computer and use it in GitHub Desktop.
Save amankharwal/6507de8d60739ad5da661038562b88c4 to your computer and use it in GitHub Desktop.
import numpy as np
import pandas as pd
from sklearn.linear_model import LinearRegression
from sklearn.utils import shuffle
data = pd.read_csv("https://raw.githubusercontent.com/amankharwal/Website-data/master/student-mat.csv")
data = data[["G1", "G2", "G3", "studytime", "failures", "absences"]]
predict = "G3"
x = np.array(data.drop([predict], 1))
y = np.array(data[predict])
from sklearn.model_selection import train_test_split
xtrain, xtest, ytrain, ytest = train_test_split(x, y, test_size=0.2)
linear_regression = LinearRegression()
linear_regression.fit(xtrain, ytrain)
predictions = linear_regression.predict(xtest)
# Calculation of R2 Score
from sklearn.model_selection import cross_val_score
print(cross_val_score(linear_regression, x, y, cv=10, scoring="r2").mean())
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment