# Assignment 4: Simple Linear Regression
# ------------------------------------------------------------
# --- Part 1: delivery time vs. sorting time -------------------------------
# Libraries behind the aliases (pd, sns, smf) that this script relies on.
import pandas as pd
import seaborn as sns
import statsmodels.formula.api as smf

# Import dataset
data = pd.read_csv('delivery_time.csv')
# Bare expressions only display inside a notebook cell; print so the script
# shows the same information when run directly.
print(data)

# Distribution of each variable. `sns.distplot` is deprecated, so the
# histogram with a KDE overlay is drawn with `histplot` on a density scale.
sns.histplot(data['Delivery Time'], kde=True, stat='density')
sns.histplot(data['Sorting Time'], kde=True, stat='density')

# Renaming columns to names without spaces so they can be written directly
# in the model formula below.
dataset = data.rename(
    {'Delivery Time': 'delivery_time', 'Sorting Time': 'sorting_time'},
    axis=1,
)
print(dataset)

# Correlation analysis
print(dataset.corr())
sns.regplot(x=dataset['sorting_time'], y=dataset['delivery_time'])

# Model building: ordinary least squares of delivery_time on sorting_time
model = smf.ols("delivery_time~sorting_time", data=dataset).fit()
print(model.summary())

# Model testing
# Finding coefficient parameters
print(model.params)

# Model predictions
# Manual prediction for, say, a sorting time of 5. The coefficients are read
# from the fitted model instead of being copied by hand from its output
# (the hand-copied version was 6.582734 + 1.649020 * 5).
delivery_time = model.params['Intercept'] + model.params['sorting_time'] * 5
print(delivery_time)

# Model-based prediction for the same sorting time. The column name must
# match the predictor used in the formula.
data_pred = pd.DataFrame({'sorting_time': [5]})
print(model.predict(data_pred))
# --- Part 2: salary vs. years of experience --------------------------------
# Import dataset. It is bound to `data1`, the name the rename and the model
# fit below refer to.
data1 = pd.read_csv('Salary_Data.csv')
# Bare expressions only display inside a notebook cell; print so the script
# shows the same information when run directly.
print(data1)

# Distribution of each variable. `sns.distplot` is deprecated, so the
# histogram with a KDE overlay is drawn with `histplot` on a density scale.
sns.histplot(data1['YearsExperience'], kde=True, stat='density')
sns.histplot(data1['Salary'], kde=True, stat='density')

# Renaming columns (this renamed copy is only used for the correlation
# table and the plot; the model is fitted on `data1`).
dataset1 = data1.rename({'YearsExperience': 'Experiance in year'}, axis=1)
print(dataset1)

# Correlation analysis
print(dataset1.corr())
sns.regplot(x=dataset1['Experiance in year'], y=dataset1['Salary'])

# Model building: ordinary least squares of Salary on YearsExperience,
# fitted on the frame that still carries the original column names.
model = smf.ols("Salary~YearsExperience", data=data1).fit()
print(model.summary())

# Model testing
# Finding coefficient parameters
print(model.params)

# Model predictions
# Manual prediction for, say, 3 years of experience. The coefficients are
# read from the fitted model instead of being copied by hand from its output
# (the hand-copied version was 25792.200199 + 9449.962321 * 3).
Salary = model.params['Intercept'] + model.params['YearsExperience'] * 3
print(Salary)

# Model-based prediction for the same input. `new_data` holds the
# experience values to predict for; the column name must match the
# predictor used in the formula.
new_data = [3]
data_pred = pd.DataFrame(new_data, columns=['YearsExperience'])
print(data_pred)
print(model.predict(data_pred))