Assignment 1
Assignment 1
Code:
import pandas as pd
import numpy as np
# Load the salary dataset from the author's local path.
df = pd.read_csv("C:\\Users\\user\\Desktop\\Sem 6\\SI\\salary_data.csv")
# Bare expressions: they only display something in an interactive session.
df.head()
df.shape

# Feature and target columns.
X = df["YearsExperience"]
y = df["Salary"]

# Positional hold-out split: the first 21 rows train the model, every
# remaining row is kept for testing.
X_train, X_test = X.iloc[:21], X.iloc[21:]
y_train, y_test = y.iloc[:21], y.iloc[21:]
X_train, y_train
# Closed-form ordinary least squares on the training split for the line
# y = a + b * x.
N = len(X_train)
sum_X = sum(X_train)
sum_Y = sum(y_train)
sum_XY = sum(X_train * y_train)
sum_X_square = sum(X_train ** 2)

# Slope. It must be assigned before the intercept, which depends on it.
# NOTE: the denominator is zero when every X_train value is identical.
b = (N * sum_XY - sum_X * sum_Y) / (N * sum_X_square - sum_X ** 2)
# Intercept.
a = (sum_Y - (b * sum_X)) / N
# Predicting Value
def pred(a, b, x):
    """Evaluate the line ``a + b * x``.

    Args:
        a: Intercept.
        b: Slope.
        x: Input value. Anything supporting ``b * x`` and ``a + ...`` works,
            so a scalar yields a scalar and an array-like that implements
            those operators yields element-wise results.

    Returns:
        ``a + b * x``.
    """
    return a + b * x
# NOTE(review): the two `for` headers below have no visible loop body (the
# file's indentation and possibly some lines were lost), so what they were
# meant to do cannot be determined from here. Presumably each one printed
# pred(a, b, x) for its split -- TODO confirm and restore the bodies.
for x in X_train:
for x in X_test:
# Evaluate pred at x = 6 with the coefficients a and b.
c = pred(a,b,6)
# Bare expression: only displays the value in an interactive session.
c
# Run pred over the whole test and training feature sets, one call each.
pred_test, pred_train = pred(a, b, X_test), pred(a, b, X_train)
# Bare expressions: only display the values in an interactive session.
pred_test
pred_train
# NOTE(review): `plt` is not imported in the visible part of this file;
# presumably `import matplotlib.pyplot as plt` -- confirm it exists.

# Figure 1: training points with the fitted line drawn over them.
plt.plot(X_train, pred_train, color="yellow")
plt.scatter(X_train, y_train)
plt.show()

# Figure 2: test split. The labels and legend used to be applied to an empty
# figure because nothing was drawn after the first show(); legend() also
# needs labelled artists to have anything to display.
# NOTE(review): the plotted series are inferred from the 'X_test' axis
# label -- confirm this is the intended figure.
plt.scatter(X_test, y_test, label="Actual")
plt.plot(X_test, pred_test, color="yellow", label="Predicted")
plt.xlabel('X_test')
plt.ylabel('Values')
plt.legend()
plt.show()
# Every call to mean_squared_error() appends its per-sample squared errors
# to this list.
error_list = []


def mean_squared_error(true, pred):
    """Return the mean of the squared differences between *true* and *pred*.

    Args:
        true: Observed values. Must support ``len()`` and element-wise
            subtraction with *pred* (e.g. a pandas Series or NumPy array).
        pred: Predicted values, element-aligned with *true*.

    Returns:
        The sum of ``(true - pred) ** 2`` divided by ``len(true)``.

    Raises:
        ValueError: If *true* is empty.

    Side effects:
        Appends the per-sample squared errors to the module-level
        ``error_list``.
    """
    if len(true) == 0:
        raise ValueError("true must not be empty")
    squared_error = (true - pred) ** 2
    error_list.append(squared_error)
    # The mean has to be computed here; returning an unassigned `mse`
    # raised NameError.
    return sum(squared_error) / len(true)
# Score the test split first, then the training split (same call order as
# before, evaluated left to right).
mse_test, mse_train = (
    mean_squared_error(y_test, pred_test),
    mean_squared_error(y_train, pred_train),
)
def abs_error(true, pred):
    """Return the mean absolute difference between *true* and *pred*.

    Args:
        true: Observed values. Must support ``len()`` and element-wise
            subtraction with *pred* (e.g. a pandas Series or NumPy array).
        pred: Predicted values, element-aligned with *true*.

    Returns:
        The sum of ``abs(true - pred)`` divided by ``len(true)``.

    Raises:
        ValueError: If *true* is empty.

    Side effects:
        Prints the per-sample absolute errors.
    """
    if len(true) == 0:
        raise ValueError("true must not be empty")
    # Per-sample absolute errors; this must exist before it is printed
    # and summed below.
    error = abs(true - pred)
    print(f"Error is:\n{error}")
    final = sum(error)
    ae = final / len(true)
    return ae
# Training-set MSE and MAE, one entry appended per pass of the loop.
error_list_mse = []
error_list_mae = []
# NOTE(review): nothing changes between passes, so all N entries are
# identical; presumably a per-iteration update of the predictions is
# missing -- TODO confirm the intended loop body.
for i in range(N):
    # `y_pred` is not defined anywhere in view; the training-set predictions
    # are stored in `pred_train`, so that name is used instead.
    mae = abs_error(y_train, pred_train)
    mse = mean_squared_error(y_train, pred_train)
    error_list_mse.append(mse)
    error_list_mae.append(mae)