Sai Ajay ajaymuktha

## datasets.py
import numpy as np
import matplotlib.pyplot as plt
import pandas as pd

## dataset.py
dataset = pd.read_csv('Salary_Data.csv')
X = dataset.iloc[:,:-1].values
Y = dataset.iloc[:,1].values

## split.py
from sklearn.model_selection import train_test_split
X_train,X_test,Y_train,Y_test = train_test_split(X,Y, test_size=0.25, random_state = 0)

## fit.py
from sklearn.linear_model import LinearRegression
from sklearn.metrics import r2_score
regressor = LinearRegression()
regressor.fit(X_train,Y_train)

## predict.py
y_pred = regressor.predict(X_test)
print(r2_score(Y_test,y_pred))

## train.py
plt.scatter(X_train,Y_train, color = 'red')
plt.plot(X_train , regressor.predict(X_train), color='blue')
plt.title('Salary vs Experience')
plt.xlabel('Years of Experience')
plt.ylabel('Salary')
plt.show()

## test.py
plt.scatter(X_test,Y_test, color = 'red')
plt.plot(X_train , regressor.predict(X_train), color='blue')
plt.title('Salary vs Experience')
plt.xlabel('Years of Experience')
plt.ylabel('Salary')
plt.show()

## libraries.py
import nltk
import urllib
import bs4 as bs
import pandas as pd
import re
from nltk.corpus import stopwords

## fetching.py
text = ""
for paragraph in soup.find_all('p'):
    text += paragraph.text

## preprocessing.py
text = re.sub(r'\[[0-9]*\]',' ',text)
text = re.sub(r'\s+',' ',text)
text = text.lower()
text = re.sub(r'\d',' ',text)
text = re.sub(r'\s+',' ',text)
	import numpy as np
	import matplotlib.pyplot as plt
	import pandas as pd
	dataset = pd.read_csv('Salary_Data.csv')
	X = dataset.iloc[:,:-1].values
	Y = dataset.iloc[:,1].values
	from sklearn.model_selection import train_test_split
	X_train,X_test,Y_train,Y_test = train_test_split(X,Y, test_size=0.25, random_state = 0)
	from sklearn.linear_model import LinearRegression
	from sklearn.metrics import r2_score
	regressor = LinearRegression()
	regressor.fit(X_train,Y_train)
	y_pred = regressor.predict(X_test)
	print(r2_score(Y_test,y_pred))
	plt.scatter(X_train,Y_train, color = 'red')
	plt.plot(X_train , regressor.predict(X_train), color='blue')
	plt.title('Salary vs Experience')
	plt.xlabel('Years of Experience')
	plt.ylabel('Salary')
	plt.show()
	plt.scatter(X_test,Y_test, color = 'red')
	plt.plot(X_train , regressor.predict(X_train), color='blue')
	plt.title('Salary vs Experience')
	plt.xlabel('Years of Experience')
	plt.ylabel('Salary')
	plt.show()
	import nltk
	import urllib
	import bs4 as bs
	import pandas as pd
	import re
	from nltk.corpus import stopwords
	text = ""
	for paragraph in soup.find_all('p'):
	text += paragraph.text
	text = re.sub(r'\[[0-9]*\]',' ',text)
	text = re.sub(r'\s+',' ',text)
	text = text.lower()
	text = re.sub(r'\d',' ',text)
	text = re.sub(r'\s+',' ',text)