Professional Documents
Culture Documents
ML Week 7 6607
ML Week 7 6607
WEEK-7
PROBLEM STATEMENT:
1. Build a multiple linear regression model using Python for a particular data set.
PYTHON PROGRAM:
import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
from sklearn.compose import ColumnTransformer
from sklearn.linear_model import LinearRegression
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import OneHotEncoder
# Load the data set. The last column is used as the regression target and
# every column before it as a feature.
file = "/content/50_Startups.csv"
df = pd.read_csv(file)
print(df, '\n')

features = df.iloc[:, :-1]
x = features.values
y = df.iloc[:, -1].values

# One-hot encode every non-numeric feature column and pass the numeric ones
# through unchanged. The columns are detected from their dtypes rather than
# hard-coded, so the script does not depend on a particular column order.
categorical_columns = [
    position
    for position, dtype in enumerate(features.dtypes)
    if not pd.api.types.is_numeric_dtype(dtype)
]
ct = ColumnTransformer(
    transformers=[('encoder', OneHotEncoder(), categorical_columns)],
    remainder='passthrough',
    # Always return a dense array: np.array() on a sparse matrix would wrap
    # it in a 0-d object array instead of producing a 2-D feature matrix.
    sparse_threshold=0,
)
X = np.array(ct.fit_transform(x))
print(X)

# Hold out 20% of the rows for testing; random_state fixes the shuffle so
# the split is reproducible between runs.
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, random_state=0
)
print(X_train, '\n')
print(X_test, '\n')
print(y_train, '\n')
print(y_test, '\n')

# Fit ordinary least squares on the training split and report the learned
# intercept and coefficients.
model = LinearRegression()
model.fit(X_train, y_train)
print(model.intercept_, '\n')
print(model.coef_, '\n')

y_pred_train = model.predict(X_train)
y_pred_test = model.predict(X_test)

# Side-by-side comparison of the held-out targets and their predictions.
dataset = pd.DataFrame({'Actual': y_test, 'Predicted': y_pred_test})
print(dataset, '\n')

# Visualization: predicted vs. actual values on the training split. The
# dashed red line is y = x, i.e. where a perfect prediction would fall.
plt.figure(figsize=(10, 5))
plt.subplot(1, 1, 1)
plt.scatter(y_train, y_pred_train, color='blue')
plt.plot(y_train, y_train, color='red', linestyle='--')
plt.xlabel('Actual')
plt.ylabel('Predicted')
plt.grid()
# Needed for the figure to be displayed when run outside a notebook.
plt.show()
Output: