Steps for Simple Regression Analysis
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
Example (reading a CSV file):
# Load placement.csv into a DataFrame.
# The path is a raw string so the backslashes are taken literally. It has to
# sit on a single line: a plain (non-triple-quoted) string literal cannot
# contain a line break.
# NOTE(review): the space between "Predictive" and "Analytics" assumes the
# original line break was a wrap at a space — confirm the folder name on disk.
df = pd.read_csv(
    r"C:\Yogesh Bhatt\9. Lectures\C. GEU\A. Course 8_Predictive Analytics\2. EDA\placement.csv"
)
Example (reading an Excel file):
# Load "Attitude and Behaviour.xlsx" into a DataFrame. This rebinds `df`,
# replacing the DataFrame read from placement.csv earlier in the file.
# The path is a raw string so the backslashes are taken literally. It has to
# sit on a single line: a plain (non-triple-quoted) string literal cannot
# contain a line break.
# NOTE(review): the space between "Predictive" and "Analytics" assumes the
# original line break was a wrap at a space — confirm the folder name on disk.
df = pd.read_excel(
    r"C:\Yogesh Bhatt\9. Lectures\C. GEU\A. Course 8_Predictive Analytics\3. Regression Analysis\Attitude and Behaviour.xlsx"
)
# Preview the first rows of the loaded data. As a bare expression this is
# only displayed in an interactive session / notebook; a script prints nothing.
df.head()

# Scatter plot of the 'kWh' column (x-axis) against the 'MT/Day' column (y-axis).
plt.scatter(x=df['kWh'], y=df['MT/Day'])
plt.xlabel(xlabel='Energy Consumption (1000 xkWh)')
plt.ylabel(ylabel='Production (MT/Day)')

# Predictor: the first column, selected with a slice so it stays two-dimensional.
X = df.iloc[:, :1]
# Response: the last column, selected by position so it is one-dimensional.
y = df.iloc[:, -1]
Step 6: Split the data set into training and test sets (four arrays: X_train, X_test, y_train, y_test) and train the model
# Split X and y into training and test parts, then fit the model on the
# training part.
# NOTE(review): train_test_split and LinearRegression are not imported in the
# visible source — presumably sklearn.model_selection.train_test_split and
# sklearn.linear_model.LinearRegression; confirm the imports exist. If so,
# test_size=0.2 holds out 20% of the rows and random_state=2 makes the
# shuffle reproducible.
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.2,
    random_state=2,
)

lr = LinearRegression()
lr.fit(X_train, y_train)

# Inspect the held-out predictor and response values (displayed only in an
# interactive session / notebook).
X_test
y_test
# Redraw the scatter of all observations, then overlay the model's
# predictions for the training inputs as a red line.
plt.scatter(x=df['kWh'], y=df['MT/Day'])
plt.plot(
    X_train.values,
    lr.predict(X_train),
    color='red',
)
plt.xlabel(xlabel='Energy Consumption (1000 xkWh)')
plt.ylabel(ylabel='Production (MT/Day)')
# Read the fitted parameters off the model: m from coef_ and b from
# intercept_ (for a straight line y = m*x + b, the slope and the intercept).
m, b = lr.coef_, lr.intercept_

# Bare expressions: displayed only in an interactive session / notebook.
m
b
# Evaluate the fitted model on the held-out test set.
# y_pred was never assigned anywhere above, so it is computed here from the
# test inputs; the metrics below compare it against y_test.
y_pred = lr.predict(X_test)

# NOTE(review): mean_absolute_error, mean_squared_error and r2_score are not
# imported in the visible source — presumably from sklearn.metrics; confirm
# the imports exist.
# The MSE is computed once and reused for the RMSE (its square root).
mse = mean_squared_error(y_test, y_pred)

print("MAE", mean_absolute_error(y_test, y_pred))
print("MSE", mse)
print("RMSE", np.sqrt(mse))
print("R2", r2_score(y_test, y_pred))