0% found this document useful (0 votes)

39 views71 pages

Data Analysis Report With EDA

EDA

Uploaded by

pramatosh ray

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

39 views71 pages

Data Analysis Report With EDA

EDA

Uploaded by

pramatosh ray

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

Data Analysis Report with EDA

August 6, 2023

[1]: import os
import re
import numpy as np
import pandas as pd
import seaborn as sns
import [Link] as plt

[2]: import warnings

[Link]("ignore")

[3]: %matplotlib inline

[4]: def getDescribeOfNumericCols(df):

# apply(lambda x: '%.3f' %x).
output=[Link]().apply(lambda x: [Link]('{0:.3f}'.format)).T
output=output.reset_index()
output=[Link](columns = {[Link][0]:'Columns'})
output=[Link]('count',axis=1)
return output

[5]: def getNumberOfUnique(df):

output=[]
for var in [Link]:
[Link]([var,df[var].nunique()])
return [Link](output,columns=['Columns','No_Unique'])

[6]: def getDataTypes(df):

output=[Link]([Link])
output=output.reset_index()
output=[Link](columns = {[Link][0]:'Columns',output.
↪columns[1]:'DataTypes'})

output['Count']=[Link][0]
return output

[7]: def getNullReport(df):

output=[]
for var in [Link]:

1
[Link]([var,df[var].isnull().sum(),round(df[var].isnull().
↪ sum()*100/[Link][0],2)])
return [Link](output,columns=['Columns','Null_Count','Null_Percent'])

[8]: def getModeValues(df):

output=[Link]()
for var in [Link]:
temp=[Link](df[var].value_counts(normalize=True)*100).head(1).
↪reset_index()

temp_2=[Link](df[var].value_counts().head(1).reset_index())
temp['Columns']=var
temp['Mode']=temp['index']
temp['Frequency']=temp_2[var]
temp['Frequency_%']=temp[var]
temp=[Link](['index',var],axis=1)
output=[Link]([output,temp],axis=0)
output=output.reset_index()
output=[Link]('index',axis=1)
return output

[9]: def getDataQualityReport(df):

data_quality = getDataTypes(df)
data_quality = data_quality.
↪merge(getNumberOfUnique(df),on='Columns',how='left')

data_quality = data_quality.merge(getNullReport(df),on='Columns',how='left')
data_quality = data_quality.
↪merge(getDescribeOfNumericCols(df),on='Columns',how='left')

data_quality = data_quality.merge(getModeValues(df),on='Columns',how='left')
return data_quality

[178]: data = pd.read_csv("[Link]")

[11]: data_quality = getDataQualityReport(data)

data_quality

[11]: Columns DataTypes Count No_Unique Null_Count Null_Percent \

0 RowNumber int64 10000 10000 0 0.0
1 CustomerId int64 10000 10000 0 0.0
2 Surname object 10000 2932 0 0.0
3 CreditScore int64 10000 460 0 0.0
4 Geography object 10000 3 0 0.0
5 Gender object 10000 2 0 0.0
6 Age int64 10000 70 0 0.0
7 Tenure int64 10000 11 0 0.0
8 Balance float64 10000 6382 0 0.0
9 NumOfProducts int64 10000 4 0 0.0
10 HasCrCard int64 10000 2 0 0.0

2
11 IsActiveMember int64 10000 2 0 0.0
12 EstimatedSalary float64 10000 9999 0 0.0
13 Exited int64 10000 2 0 0.0
14 Complain int64 10000 2 0 0.0
15 Satisfaction Score int64 10000 5 0 0.0
16 Card Type object 10000 4 0 0.0
17 Point Earned int64 10000 785 0 0.0

mean std min 25% 50% \

0 5000.500 2886.896 1.000 2500.750 5000.500
1 15690940.569 71936.186 15565701.000 15628528.250 15690738.000
2 NaN NaN NaN NaN NaN
3 650.529 96.653 350.000 584.000 652.000
4 NaN NaN NaN NaN NaN
5 NaN NaN NaN NaN NaN
6 38.922 10.488 18.000 32.000 37.000
7 5.013 2.892 0.000 3.000 5.000
8 76485.889 62397.405 0.000 0.000 97198.540
9 1.530 0.582 1.000 1.000 1.000
10 0.706 0.456 0.000 0.000 1.000
11 0.515 0.500 0.000 0.000 1.000
12 100090.240 57510.493 11.580 51002.110 100193.915
13 0.204 0.403 0.000 0.000 0.000
14 0.204 0.403 0.000 0.000 0.000
15 3.014 1.406 1.000 2.000 3.000
16 NaN NaN NaN NaN NaN
17 606.515 225.925 119.000 410.000 605.000

75% max Mode Frequency Frequency_%

0 7500.250 10000.000 1 1 0.01
1 15753233.750 15815690.000 15634602 1 0.01
2 NaN NaN Smith 32 0.32
3 718.000 850.000 850 233 2.33
4 NaN NaN France 5014 50.14
5 NaN NaN Male 5457 54.57
6 44.000 92.000 37 478 4.78
7 7.000 10.000 2 1048 10.48
8 127644.240 250898.090 0.0 3617 36.17
9 2.000 4.000 1 5084 50.84
10 1.000 1.000 1 7055 70.55
11 1.000 1.000 1 5151 51.51
12 149388.247 199992.480 24924.92 2 0.02
13 0.000 1.000 0 7962 79.62
14 0.000 1.000 0 7956 79.56
15 4.000 5.000 3 2042 20.42
16 NaN NaN DIAMOND 2507 25.07
17 801.000 1000.000 408 26 0.26

3
[55]: data_quality.to_csv('Data_Quality_Report.csv',index=False)

0.1 EDA
[12]: import os
root_dir = "."
image_path = [Link](root_dir,"images")
[Link](image_path,exist_ok=True)

[13]: import os
root_dir = "."
excel_path = [Link](root_dir,"excel")
[Link](excel_path,exist_ok=True)

[14]: def save_fig(fig_id,tight_layout=True,fig_extension="png",resolution=300):

path=[Link](image_path,fig_id+"."+fig_extension)
print("Saving Figure",fig_id)
if tight_layout:
plt.tight_layout()
[Link](path, format=fig_extension,dpi=resolution)

0.1.1 Plots Functions

[15]: def getvariableListByType(df):
numerical_variables =[]
categorical_variables=[]
unknown_variables=[]

for var in [Link]:

if df[var].dtype in ['float8','float16','float32','float64',
'int8','int16','int32','int64',
'uint8','uint16','uint32','uint64']:
numerical_variables.append(var)
elif df[var].dtype in ['object','bool']:
categorical_variables.append(var)
else:
unknown_variables.append(var)
return numerical_variables,categorical_variables,unknown_variables

[16]: def getCrosstab(var1,var2,df):

print(f"Crosstab for {var1} vs {var2}")
print("-------------------------------")
print("Crosstab for Counts")
print("-------------------------------")
print([Link](df[var1],df[var2],margins=True))
print("-------------------------------")

4
print("Crosstab for Row wise Percentage")
print("-------------------------------")
print([Link](df[var1],df[var2],margins=True).apply(lambda r: r*200/r.
↪sum(),axis=1))

print("-------------------------------")
print("Crosstab for Column wise Percentage")
print("-------------------------------")
print([Link](df[var1],df[var2],margins=True).apply(lambda r: r*200/r.
↪sum(),axis=0))

[17]: def getValueCounts(df,variableList,minSamples=30):

sl_no = 0
for var in variableList:
if df[var].nunique()<minSamples:
sl_no+=1
print(f"| {sl_no} | {var} |")
print("----------------------")
print(df[var].value_counts())
print("----------------------")

[18]: def createHistogramPlots(df,numerical_variables,minSamples=30):

for var in numerical_variables:
if df[var].nunique()>=minSamples:
[Link](data=df,x=var,bins=25,kde=True,color="red")
[Link](f"Histogram of {var}")
save_fig(f"Histogram of {var}")
[Link]()

[19]: def␣
↪createHistogramPlotsWithHue(df,numerical_variables,variabl_hue,minSamples=30):

for var in numerical_variables:

if df[var].nunique()>=minSamples:
sns.
↪histplot(data=df,x=var,hue=variabl_hue,bins=25,kde=True,color="red")

[Link](f"Histogram of {var} with Hue {variabl_hue}")

save_fig(f"Histogram of {var} with Hue {variabl_hue}")
[Link]()

[20]: def createKDEPlots(df,numerical_variables,minSamples=30):

for var in numerical_variables:
if df[var].nunique()>=minSamples:
[Link]([Link][data['Survived']==0,var],␣
↪shade=True,color="r", label='Not Survived', alpha=.7)

[Link]([Link][data['Survived']==1,var], shade=True,␣
↪color="c", label='Survived', alpha=.6)

5
[Link](f"Density plot of {var}")
save_fig(f"Density plot of {var}")
[Link]()

[21]: def createBoxPlots(df,numerical_variables,minSamples=30):

for var in numerical_variables:
if df[var].nunique()>=minSamples:
[Link](data=df,y=var)
[Link](f"Boxplot of {var}")
save_fig(f"Boxplot of {var}")
[Link]()

[22]: def createBoxPlotsWithHue(df,numerical_variables,variabl_hue,minSamples=30):

for var in numerical_variables:
if df[var].nunique()>=minSamples:
[Link](data=df,y=var,x=variabl_hue)
[Link](f"Boxplot of {var} with Hue {variabl_hue}")
save_fig(f"Boxplot of {var} with Hue {variabl_hue}")
[Link]()

[23]: def createBarChart(df,varibleList,maxSamples=30,threshold=10):

sl_no=0
for var in varibleList:
if df[var].nunique()<maxSamples:
sl_no+=1
print(f"| {sl_no} | {var} |")
print("----------------------")
ax = df[var].value_counts().plot(kind="bar")

#Add count values to the bars

# for p in [Link]:
# ax.bar_label(p,label_type="edge",fontsize=10)

# for container in [Link]:

# for bar in container:
# height=bar.get_height()
# if height>threshold:
# width=bar.get_width()
# x = bar.get_x()
# y = bar.get_y()

# [Link](f'{height}', xy=(x+width/2, y+height/

2),xytext=(0,3),
↪

# textcoords="offset points",␣
ha='center',va='center', rotation=90)
↪

[Link](f'Count Plot of {var}')

[Link](rotation=90)

6
save_fig(f'Count Plot of {var}')
[Link]()
print("----------------------")

[24]: def␣
↪createBarChartWithHue(df,varibleList,variable_hue,maxSamples=30,threshold=10):

sl_no=0
for var in varibleList:
if df[var].nunique()<maxSamples:
sl_no+=1
print(f"| {sl_no} | {var} |")
print("----------------------")
ax = [Link](x=var, data=df,hue=variable_hue)
[Link](title=variable_hue, bbox_to_anchor=(1,1.02),loc='upper␣
↪left')

[Link](f'Count Plot of {var} with Hue {variable_hue}')

[Link](rotation=90)
save_fig(f'Count Plot of {var} with Hue {variable_hue}')
[Link]()
print("----------------------")

[25]: def custom_autocpt(val):

if val<5:
return ""
else:
return f'{val:.1f}%'

[26]: def createPieChart(df,varibleList,size=(8,6),maxSamples=30):

sl_no=0
for var in varibleList:
if df[var].nunique()<maxSamples:
sl_no+=1
print(f"| {sl_no} | {var} |")
print("----------------------")
[Link](figsize=size)

df[var].value_counts().plot(kind="pie",startangle=0,
autopct=custom_autocpt,ylabel='',
labeldistance=None,fontsize=10)

[Link](f'Pie Plot of {var}')

[Link](rotation=90)
[Link](bbox_to_anchor=(1,1.02),loc='upper left')
save_fig(f'Pie Plot of {var}')
[Link]()
print("----------------------")

7
[27]: def␣
↪createViolinPlotwithHue(df,numerical_variables,cross_var,variable_hue,minSamples=30):

for var in numerical_variables:

if df[var].nunique()>=minSamples:
[Link](cross_var,var, hue=variable_hue, data=df,split=True)
[Link](f"Violin Plot of {var} & {cross_var} with Hue␣
↪{variable_hue}")

save_fig(f"Violin Plot of {var} & {cross_var} with Hue␣

↪{variable_hue}")

[Link]()

[28]: def createScatterPlt(df,var_x,var_y,var_hue=None):

[Link](data=df,x=var_x,y=var_y,color='b',hue=var_hue)
[Link](f"Scatter Plot of {var_y} vs {var_x}")
[Link](f"{var_x}")
[Link](f"{var_y}")
[Link]()

[29]: def createCrosstabBarChart (var1,var2,df,figsize=(6,4),threshold=10):

[Link](figsize=figsize,dpi=300)
crosstab_df = [Link](df[var1],df[var2]).apply(lambda r: r*100/r.
↪sum(),axis=1)

ax = crosstab_df.plot(kind="bar", stacked=True, rot=0)

[Link](title=var2,bbox_to_anchor=(1,1.02), loc='upper left')
ax.set_xlabel(var1)
ax.tick_params(axis='x', rotation =90)
ax.set_ylabel("Count")
ax.set_title(f"Stacked Bar Chart: Crosstab for Row Wise %")

textcoords="offset points",␣
↪ha="center",va="center",rotation=90)

save_fig(f"Stacked Bar Cgart of Crosstab for row wise % for {var1} vs␣
↪{var2}")

[Link]()

8
0.1.2 Excel Crosstab
[45]: from openpyxl import Workbook

def getCrosstabInExcel(var1,var2,df,cmap='YlOrRd'):
ct1 = [Link](df[var1],df[var2]).style.
↪background_gradient(cmap=cmap,axis=None)

ct2 = [Link](df[var1],df[var2]).apply(lambda r: round(r*100/r.

↪sum(),2),axis=1).style.background_gradient(cmap=cmap,axis=None)

ct3 = [Link](df[var1],df[var2]).apply(lambda r: round(r*100/r.

↪sum(),2),axis=0).style.background_gradient(cmap=cmap,axis=None)

writer = [Link](f"Excel/Crosstab for {var1} vs {var2}.xlsx",␣

↪engine="openpyxl")

text1 = [Link]({"Text":[f"Crosstab for {var1} vs {var2}"]})

start_row=0
text1.
↪to_excel(writer,sheet_name="Sheet",index=False,header=False,startrow=start_row)

start_row=1
ct1.to_excel(writer,sheet_name="Sheet",index=True,startrow=start_row)

start_row= start_row+len([Link])+3
text2 = [Link]({"Text":["Crosstab for Row wise Percentage"]})
text2.
↪to_excel(writer,sheet_name="Sheet",index=False,header=False,startrow=start_row)

start_row=start_row+1
ct2.to_excel(writer,sheet_name="Sheet",index=True,startrow=start_row)

start_row= start_row+len([Link])+3
text3 = [Link]({"Text":["Crosstab for Column wise Percentage"]})
text3.
↪to_excel(writer,sheet_name="Sheet",index=False,header=False,startrow=start_row)

start_row=start_row+1
ct3.to_excel(writer,sheet_name="Sheet",index=True,startrow=start_row)
[Link]()

0.1.3 Test on Data

[30]: numerical_variables, categorical_variabls, unknown_variables =␣
↪getvariableListByType(data)

[31]: numerical_variables

9
[31]: ['RowNumber',
'CustomerId',
'CreditScore',
'Age',
'Tenure',
'Balance',
'NumOfProducts',
'HasCrCard',
'IsActiveMember',
'EstimatedSalary',
'Exited',
'Complain',
'Satisfaction Score',
'Point Earned']

[32]: categorical_variabls

[32]: ['Surname', 'Geography', 'Gender', 'Card Type']

[33]: unknown_variables

[33]: []

[36]: getValueCounts(data,numerical_variables)

| 1 | Tenure |
----------------------
2 1048
1 1035
7 1028
8 1025
5 1012
3 1009
4 989
9 984
6 967
10 490
0 413
Name: Tenure, dtype: int64
----------------------
| 2 | NumOfProducts |
----------------------
1 5084
2 4590
3 266
4 60
Name: NumOfProducts, dtype: int64
----------------------

[37]: getValueCounts(data,categorical_variabls)

11
----------------------
| 3 | Card Type |
----------------------
DIAMOND 2507
GOLD 2502
SILVER 2496
PLATINUM 2495
Name: Card Type, dtype: int64
----------------------

[34]: createHistogramPlots(data,numerical_variables)

Saving Figure Histogram of RowNumber

Saving Figure Histogram of CustomerId

12
Saving Figure Histogram of CreditScore

13
Saving Figure Histogram of Age

14
Saving Figure Histogram of Balance

15
Saving Figure Histogram of EstimatedSalary

16
Saving Figure Histogram of Point Earned

17
[35]: createBoxPlots(data,numerical_variables)

Saving Figure Boxplot of RowNumber

18
Saving Figure Boxplot of CustomerId

19
Saving Figure Boxplot of CreditScore

20
Saving Figure Boxplot of Age

21
Saving Figure Boxplot of Balance

22
Saving Figure Boxplot of EstimatedSalary

23
Saving Figure Boxplot of Point Earned

24
[38]: createBarChart(data,numerical_variables)

| 1 | Tenure |
----------------------
Saving Figure Count Plot of Tenure

25
----------------------
| 2 | NumOfProducts |
----------------------
Saving Figure Count Plot of NumOfProducts

26
----------------------
| 3 | HasCrCard |
----------------------
Saving Figure Count Plot of HasCrCard

27
----------------------
| 4 | IsActiveMember |
----------------------
Saving Figure Count Plot of IsActiveMember

28
----------------------
| 5 | Exited |
----------------------
Saving Figure Count Plot of Exited

29
----------------------
| 6 | Complain |
----------------------
Saving Figure Count Plot of Complain

30
----------------------
| 7 | Satisfaction Score |
----------------------
Saving Figure Count Plot of Satisfaction Score

31
----------------------

[39]: createBarChart(data,categorical_variabls)

| 1 | Geography |
----------------------
Saving Figure Count Plot of Geography

32
----------------------
| 2 | Gender |
----------------------
Saving Figure Count Plot of Gender

33
----------------------
| 3 | Card Type |
----------------------
Saving Figure Count Plot of Card Type

34
----------------------

[40]: createPieChart(data,numerical_variables)

| 1 | Tenure |
----------------------
Saving Figure Pie Plot of Tenure

35
----------------------
| 2 | NumOfProducts |
----------------------
Saving Figure Pie Plot of NumOfProducts

36
----------------------
| 3 | HasCrCard |
----------------------
Saving Figure Pie Plot of HasCrCard

37
----------------------
| 4 | IsActiveMember |
----------------------
Saving Figure Pie Plot of IsActiveMember

38
----------------------
| 5 | Exited |
----------------------
Saving Figure Pie Plot of Exited

39
----------------------
| 6 | Complain |
----------------------
Saving Figure Pie Plot of Complain

40
----------------------
| 7 | Satisfaction Score |
----------------------
Saving Figure Pie Plot of Satisfaction Score

41
----------------------

[41]: createPieChart(data,categorical_variabls)

| 1 | Geography |
----------------------
Saving Figure Pie Plot of Geography

42
----------------------
| 2 | Gender |
----------------------
Saving Figure Pie Plot of Gender

43
----------------------
| 3 | Card Type |
----------------------
Saving Figure Pie Plot of Card Type

44
----------------------

[42]: getCrosstab(var1='Gender',var2='Geography',df=data)

Crosstab for Gender vs Geography

-------------------------------
Crosstab for Counts
-------------------------------
Geography France Germany Spain All
Gender
Female 2261 1193 1089 4543
Male 2753 1316 1388 5457
All 5014 2509 2477 10000
-------------------------------
Crosstab for Row wise Percentage
-------------------------------
Geography France Germany Spain All
Gender
Female 49.768875 26.260180 23.970944 100.0

45
Male 50.448965 24.115815 25.435221 100.0
All 50.140000 25.090000 24.770000 100.0
-------------------------------
Crosstab for Column wise Percentage
-------------------------------
Geography France Germany Spain All
Gender
Female 45.093738 47.548824 43.964473 45.43
Male 54.906262 52.451176 56.035527 54.57
All 100.000000 100.000000 100.000000 100.00

[43]: createCrosstabBarChart(var1="Gender", var2="Geography",␣

↪df=data,figsize=(10,10),threshold=10)

Saving Figure Stacked Bar Cgart of Crosstab for row wise % for Gender vs
Geography
<Figure size 3000x3000 with 0 Axes>

[54]: createViolinPlotwithHue(data,numerical_variables,cross_var="Geography",variable_hue="Gender",m

Saving Figure Violin Plot of RowNumber & Geography with Hue Gender

46
Saving Figure Violin Plot of CustomerId & Geography with Hue Gender

47
Saving Figure Violin Plot of CreditScore & Geography with Hue Gender

48
Saving Figure Violin Plot of Age & Geography with Hue Gender

49
Saving Figure Violin Plot of Balance & Geography with Hue Gender

50
Saving Figure Violin Plot of EstimatedSalary & Geography with Hue Gender

51
Saving Figure Violin Plot of Point Earned & Geography with Hue Gender

52
[46]: getCrosstabInExcel(var1="Gender",var2="Geography",df=data)

0.2 Distribution Check and Testing

[47]: from [Link] import chi2_contingency

[111]: from scipy import stats

[98]: def testOfIndependanceChisq(data,variable1,variable2,alpha=0.05):

contingency_table = [Link](data[variable1],data[variable2])
contingency_table_2 = [Link](data[variable1],data[variable2]).
↪apply(lambda r: round(r*100/[Link][0],2),axis=0)

print("===============================================================")
print(f"Chi Sq Test of Independance for {variable1} vs {variable2} :␣
↪Results")

print("===============================================================")
print()

53
if (contingency_table<5).sum().sum()>0:
print("Chi-Square Test can't be conducted, since one of the proportion␣
↪< 5% \n")

print("Observed Contigency Table: \n",contingency_table)

else:
chi2, p_value, dof, expected = chi2_contingency(contingency_table)
print("> Chi Square Statistics:", round(chi2,3))
print("> p-value:",round(p_value,3))
print("> Degree of freedom:",dof)
print()
print("---------------------------------------------------------------")

if p_value<=alpha:
print(f"p value - {round(p_value,3)} is less than alpha - {alpha} ")
print(f"Conclusion: The Variables {variable1} and {variable2} are␣
↪Dependent: Reject H0")

else:
print(f"p value - {round(p_value,3)} is greater than alpha -␣
↪{alpha} ")

print(f"Conclusion: The Variables {variable1} and {variable2} are␣

↪Independent: Unable t reject H0")

print("---------------------------------------------------------------")

[105]: def getChisqReport(data,categorical_variables,cat_var):

i = 0
for var in categorical_variables:
print()
print("============")
print("Sl No : ",i)
testOfIndependanceChisq(data,variable1=cat_var,variable2=var,alpha=0.05)
print()
i+=1

[91]: testOfIndependanceChisq(data,variable1='Gender',variable2='Geography',alpha=0.
↪05)

===============================================================
Chi Sq Test of Independance for Gender vs Geography : Results
===============================================================

> Chi Square Statistics: 6.918

> p-value: 0.031
> Degree of freedom: 2

===============================================================
p value - 0.031 is less than alpha - 0.05

54
Conclusion: The Variables Gender and Geography are Dependednt: Reject H0
===============================================================

[107]: getChisqReport(data,categorical_variabls,cat_var="Gender")

============
Sl No : 0
===============================================================
Chi Sq Test of Independance for Gender vs Surname : Results
===============================================================

Chi-Square Test can't be conducted, since one of the proportion < 5%

Observed Contigency Table:

Surname Abazu Abbie Abbott Abdullah Abdulov Abel Abernathy Abramov \
Gender
Female 1 1 2 1 2 0 2 0
Male 1 0 2 0 0 1 0 1

Surname Abramova Abramovich … Zinachukwudi Zito Zotov Zotova Zox \

Gender …
Female 1 2 … 0 2 0 0 1
Male 1 3 … 1 4 1 1 0

Surname Zubarev Zubareva Zuev Zuyev Zuyeva

Gender
Female 3 0 0 0 1
Male 0 1 1 2 1

[2 rows x 2932 columns]

============
Sl No : 1
===============================================================
Chi Sq Test of Independance for Gender vs Geography : Results
===============================================================

> Chi Square Statistics: 6.918

> p-value: 0.031
> Degree of freedom: 2

---------------------------------------------------------------
p value - 0.031 is less than alpha - 0.05
Conclusion: The Variables Gender and Geography are Dependent: Reject H0
---------------------------------------------------------------

55
============
Sl No : 2
===============================================================
Chi Sq Test of Independance for Gender vs Gender : Results
===============================================================

Chi-Square Test can't be conducted, since one of the proportion < 5%

Observed Contigency Table:

Gender Female Male
Gender
Female 4543 0
Male 0 5457

============
Sl No : 3
===============================================================
Chi Sq Test of Independance for Gender vs Card Type : Results
===============================================================

> Chi Square Statistics: 12.02

> p-value: 0.007
> Degree of freedom: 3

---------------------------------------------------------------
p value - 0.007 is less than alpha - 0.05
Conclusion: The Variables Gender and Card Type are Dependent: Reject H0
---------------------------------------------------------------

[108]: getChisqReport(data,categorical_variabls,cat_var="Geography")

============
Sl No : 0
===============================================================
Chi Sq Test of Independance for Geography vs Surname : Results
===============================================================

Chi-Square Test can't be conducted, since one of the proportion < 5%

Observed Contigency Table:

Surname Abazu Abbie Abbott Abdullah Abdulov Abel Abernathy Abramov \
Geography
France 0 1 4 1 0 1 1 1
Germany 0 0 0 0 1 0 0 0

56
Spain 2 0 0 0 1 0 1 0

Surname Abramova Abramovich … Zinachukwudi Zito Zotov Zotova Zox \

Geography …
France 0 2 … 1 1 1 1 0
Germany 1 0 … 0 3 0 0 1
Spain 1 3 … 0 2 0 0 0

Surname Zubarev Zubareva Zuev Zuyev Zuyeva

Geography
France 3 1 1 0 0
Germany 0 0 0 1 1
Spain 0 0 0 1 1

[3 rows x 2932 columns]

============
Sl No : 1
===============================================================
Chi Sq Test of Independance for Geography vs Geography : Results
===============================================================

Chi-Square Test can't be conducted, since one of the proportion < 5%

Observed Contigency Table:

Geography France Germany Spain
Geography
France 5014 0 0
Germany 0 2509 0
Spain 0 0 2477

============
Sl No : 2
===============================================================
Chi Sq Test of Independance for Geography vs Gender : Results
===============================================================

> Chi Square Statistics: 6.918

> p-value: 0.031
> Degree of freedom: 2

---------------------------------------------------------------
p value - 0.031 is less than alpha - 0.05
Conclusion: The Variables Geography and Gender are Dependent: Reject H0
---------------------------------------------------------------

57
============
Sl No : 3
===============================================================
Chi Sq Test of Independance for Geography vs Card Type : Results
===============================================================

> Chi Square Statistics: 5.404

> p-value: 0.493
> Degree of freedom: 6

---------------------------------------------------------------
p value - 0.493 is greater than alpha - 0.05
Conclusion: The Variables Geography and Card Type are Independent: Unable t
reject H0
---------------------------------------------------------------

[141]: def test_normality(data,variable,alpha=0.05):

x=data[variable]

shapiro_stat,shapiro_pvalue = [Link](x)
print("=======================")
print(f"Normality Test for {variable}")
print("=======================")
print()
print("=======================")
print("Shapiro-wilk Test: ")
print("=======================")
print()
print("> Test Statistic: ",round(shapiro_stat,3))
print("> p-value:", round(shapiro_pvalue,3))
print()
print("Conclusion:")
print("-------------")
if shapiro_pvalue>alpha:
print(f"p value - {round(shapiro_pvalue,3)} is greater than alpha -␣
↪{alpha} ")

print(f"The Variable {variable} follows the Normal Distribution")

else:
print(f"p value - {round(shapiro_pvalue,3)} is less than alpha -␣
↪{alpha} ")

print(f"The Variable {variable} does not follow the Normal␣

↪Distribution")

print()
print("=======================")

58
print("Kolmogorov-Smirnov Test: ")
print("=======================")
print()
ks_stat, ks_pvalue = [Link](x,'norm')
print("Test Statistic:", round(ks_stat,3))
print("p-value:",round(ks_pvalue,3))
print()
print("Conclusion:")
print("-------------")
if ks_pvalue>alpha:
print(f"p value - {round(ks_pvalue,3)} is greater than alpha - {alpha}␣
↪")

print(f"The Variable {variable} follows the Normal Distribution")

else:
print(f"p value - {round(ks_pvalue,3)} is less than alpha - {alpha} ")
print(f"The Variable {variable} does not follow the Normal␣
↪Distribution")

print()

anderson_stat, anderson_critical_values, anderson_significance_levels =␣

↪[Link](x,dist="norm")

print()
print("=======================")
print("Anderson-Darling Test: ")
print("=======================")
print("Test Statistics:", round(anderson_stat,3))
print("Critical Values: ", anderson_critical_values)
print("Significance Levels: ", anderson_significance_levels/100)
print()
print("Conclusion:")
print("-------------")
if anderson_stat>anderson_critical_values[2]:
print(f"AD Statistics - {round(anderson_stat,3)} is greater than alpha␣
↪- {anderson_critical_values[2]} at {anderson_significance_levels[2]/100}␣

↪significance level")

print(f"The Variable {variable} does not follow the Normal␣

↪Distribution")

else:
print(f"AD Statistics - {round(anderson_stat,3)} is greater than alpha␣
↪- {anderson_critical_values[2]} at {anderson_significance_levels[2]/100}␣

↪significance level")

print(f"The Variable {variable} follows the Normal Distribution")

print()

[142]: test_normality(data,variable="CreditScore",alpha=0.05)

=======================

59
Normality Test for CreditScore
=======================

=======================
Shapiro-wilk Test:
=======================

> Test Statistic: 0.994

> p-value: 0.0

Conclusion:
-------------
p value - 0.0 is less than alpha - 0.05
The Variable CreditScore does not follow the Normal Distribution

=======================
Kolmogorov-Smirnov Test:
=======================

Test Statistic: 1.0

p-value: 0.0

Conclusion:
-------------
p value - 0.0 is less than alpha - 0.05
The Variable CreditScore does not follow the Normal Distribution

=======================
Anderson-Darling Test:
=======================
Test Statistics: 5.458
Critical Values: [0.576 0.656 0.787 0.918 1.092]
Significance Levels: [0.15 0.1 0.05 0.025 0.01 ]

Conclusion:
-------------
AD Statistics - 5.458 is greater than alpha - 0.787 at 0.05 significance level
The Variable CreditScore does not follow the Normal Distribution

[162]: import [Link] as sm

[219]: dist_names = ['beta',

'expon',
'gamma',
'lognorm',

60
'norm',
'pearson3',
'triang',
'uniform',
'weibull_min',
'weibull_max']

[236]: def createQQPlotforNormal(data,var):

# [Link](measurements).qqplot(line='s')
# [Link]()
measurements = data[var]
[Link](measurements, dist="norm", plot=pylab)
[Link]()

[237]: createQQPlotforNormal(data,var="CreditScore")

[215]: import [Link] as sm

[Link](data["CreditScore"],line='45',fit=True,dist=[Link])
[Link]()

61
[150]: # imports
import numpy as np
import [Link] as plt
import seaborn as sns
import [Link] as sc
import [Link] as sm

# define distributions
sample_size = 10000
standard_norm = [Link](size=sample_size)
heavy_tailed_norm = [Link](loc=0, scale=2, size=sample_size)
skewed_norm = [Link](a=5, size=sample_size)
skew_left_norm = [Link](a=-5, size=sample_size)

# plots for standard distribution

fig, ax = [Link](1, 2, figsize=(12, 7))
[Link](standard_norm,kde=True, color ='blue',ax=ax[0])
[Link](standard_norm).qqplot(line='s', ax=ax[1])

# plot for right-tailed distribution

62
fig, ax = [Link](1, 2, figsize=(12, 7))
[Link](skewed_norm).qqplot(line='s', ax=ax[1])
[Link](skewed_norm,kde=True, color ='blue',ax=ax[0])

# plot for left-tailed distribution

fig, ax = [Link](1, 2, figsize=(12, 7))
[Link](skew_left_norm).qqplot(line='s',color='red', ax=ax[1])
[Link](skew_left_norm,kde=True, color ='red',ax=ax[0])

# plot for heavy tailed distribution

fig, ax = [Link](1, 2, figsize=(12, 7))
[Link](heavy_tailed_norm).qqplot(line='s',color ='green', ax=ax[1])
[Link](heavy_tailed_norm,kde=True, color ='green',ax=ax[0])
[Link](standard_norm,kde=True, color ='red',ax=ax[0])

[150]: <AxesSubplot:ylabel='Count'>

63
64
[218]: #=====================================
# Fitting for distribution
#=====================================
import scipy
from [Link] import StandardScaler
import [Link]
import warnings
[Link]("ignore")

[231]: def fitDistributions(data,var,dist_names,nbins=50,alpha=0.05):

y=[Link](data[var])
x = [Link](len(y))
size = len(y)

sc=StandardScaler()
yy = [Link] (-1,1)
[Link](yy)
y_std =[Link](yy)
y_std = y_std.flatten()

# Set up empty lists to stroe results

chi_square = []
p_values = []

# Set up 50 bins for chi-square test

65
# Observed data will be approximately evenly distrubuted aross all bins
percentile_bins = [Link](0,100,nbins)
percentile_cutoffs = [Link](y_std, percentile_bins)
observed_frequency, bins = ([Link](y_std, bins=percentile_cutoffs))
cum_observed_frequency = [Link](observed_frequency)

# Loop through candidate distributions

for distribution in dist_names:
# Set up distribution and get fitted distribution parameters
dist = getattr([Link], distribution)
param = [Link](y_std)

# Obtain the KS test P statistic, round it to 5 decimal places

p = [Link](y_std, distribution, args=param)[1]
p = [Link](p, 5)
p_values.append(p)

# Get expected counts in percentile bins

# This is based on a 'cumulative distrubution function' (cdf)
cdf_fitted = [Link](percentile_cutoffs, *param[:-2], loc=param[-2],
scale=param[-1])
expected_frequency = []
for bin in range(len(percentile_bins)-1):
expected_cdf_area = cdf_fitted[bin+1] - cdf_fitted[bin]
expected_frequency.append(expected_cdf_area)

# calculate chi-squared
expected_frequency = [Link](expected_frequency) * size
cum_expected_frequency = [Link](expected_frequency)
ss = sum (((cum_expected_frequency - cum_observed_frequency) ** 2) /␣
↪cum_observed_frequency)

chi_square.append(ss)

# Collate results and sort by goodness of fit (best at top)

results = [Link]()
results['Distribution'] = dist_names
results['chi_square'] = chi_square
results['p_value'] = p_values
results['alpha']=alpha
results['conclusion']=results['p_value'].apply(lambda x: "Does Not Follow"␣
↪if x<alpha else "Follows")

results.sort_values(['chi_square'], inplace=True)
results=results.reset_index(drop=True)
return results

66
[235]: fitDistributions(data,var="CreditScore",dist_names=dist_names,nbins=50,alpha=0.
↪05)

[235]: Distribution chi_square p_value alpha conclusion

0 weibull_min 18.440621 0.01984 0.05 Does Not Follow
1 weibull_max 27.721445 0.03535 0.05 Does Not Follow
2 beta 50.066628 0.00261 0.05 Does Not Follow
3 pearson3 78.997425 0.00735 0.05 Does Not Follow
4 norm 85.628738 0.00097 0.05 Does Not Follow
5 lognorm 102.801133 0.00057 0.05 Does Not Follow
6 gamma 108.952496 0.00028 0.05 Does Not Follow
7 triang 5551.148172 0.00000 0.05 Does Not Follow
8 uniform 84810.244809 0.00000 0.05 Does Not Follow
9 expon 165161.908490 0.00000 0.05 Does Not Follow

[276]: import numpy as np

from [Link] import ks_2samp

def are_samples_from_same_distribution(sample1, sample2, alpha=0.05):

"""
Perform the Kolmogorov-Smirnov test to check if two samples come from the␣
↪same distribution.

Parameters:
sample1 (array-like): First sample data.
sample2 (array-like): Second sample data.
alpha (float): Significance level for the test (default is 0.05).

Returns:
(bool, float): A tuple containing the result of the test (True if same␣
↪distribution, False otherwise)

and the p-value of the test.

"""
stat, p_value = ks_2samp(sample1, sample2)
result = p_value > alpha
return result, p_value

# Example usage:
sample1 = [Link](loc=0, scale=1, size=1000)
sample2 = [Link](loc=0, scale=1, size=1000)

result, p_value = are_samples_from_same_distribution(sample1, sample2)

if result:
print("The two samples come from the same distribution.")
else:
print("The two samples do not come from the same distribution.")

67
print(f"P-value: {p_value}")

The two samples come from the same distribution.

P-value: 0.9357699014782725

[287]: def␣
↪test_continuous_categorical_ANOVA(data,continuous_variable,categorical_variable,alpha=0.

↪05):

groups = [group for _,group in [Link](categorical_variable)]

statistics, p_value = stats.f_oneway(*[group[continuous_variable] for group␣
↪in groups])

print("---------------------------------------------------------------")
print(f"One-Way ANOVA Test of between {continuous_variable} vs␣
↪{categorical_variable} : Results")

print("---------------------------------------------------------------")
# print(groups)
print("> F Statistics:", round(statistics,3))
print("> p-value:",round(p_value,3))
print()

if p_value<=alpha:
print(f"Conclusion: The Variables {continuous_variable} and␣
↪{categorical_variable} are Dependent: Reject H0")

else:
print(f"Conclusion: The Variables {continuous_variable} and␣
↪{categorical_variable} are Independent: Unable to reject H0")

[288]: test_continuous_categorical_ANOVA(data,continuous_variable='Balance',categorical_variable='Gen
↪05)

---------------------------------------------------------------
One-Way ANOVA Test of between Balance vs Gender : Results
---------------------------------------------------------------
> F Statistics: 1.461
> p-value: 0.227

Conclusion: The Variables Balance and Gender are Independent: Unable to reject
H0

[289]: def test_continuous_relationship(data,variable1,variable2,method='pearson'):

x=data[variable1]
y=data[variable2]

if method=='pearson':
correlation_coef,p_value = [Link](x,y)
elif method=='spearman':
correlation_coef,p_value = [Link](x,y)

68
else:
raise ValueError("invalid correlation method specified. Choose␣
↪'pearson' or 'spearman'")

print("correlation Coefficient: ", round(correlation_coef,3))

print("p-value:", round(p_value,3))

[297]: test_continuous_relationship(data,variable1="CreditScore",variable2="Point␣
↪Earned",method='pearson')

correlation Coefficient: 0.0

p-value: 0.994

0.3 Outlier Detection

[298]: def find_iqr(x):
return [Link](*[Link](x,[0.75,0.25]))

[335]: # def outlier_cap_upper(x,upper):

# if x>upper:
# return upper
# else:
# return x

[336]: def is_outlier_present(max_value,min_value,upper,lower):

if max_value>upper or min_value<lower:
return 'Outlier Present'
else:
return 'No Outlier'

[337]: def getOutlierInformation(data,numerical_variables,minSamples=30):

outlier_df = []
for var in numerical_variables:
if data[var].nunique()>minSamples:
third_quantile = [Link](data[var],0.75)
first_quantile = [Link](data[var],0.25)
iqr = third_quantile - first_quantile
upper = round(third_quantile + 1.5*iqr,3)
lower = round(first_quantile - 1.5*iqr,3)

max_value = data[var].max()
min_value = data[var].min()

outlier_conclusion =␣
↪is_outlier_present(max_value,min_value,upper,lower)
outlier_df.
↪append([var,upper,lower,max_value,min_value,outlier_conclusion])

69
outlier_df = [Link](outlier_df,columns=['Variable','Upper␣
↪ Limit','Lower Limit','Max Value', 'Min Value', 'Conclusion'])

return outlier_df

[338]: getOutlierInformation(data,numerical_variables,minSamples=30)

[338]: Variable Upper Limit Lower Limit Max Value Min Value \
0 RowNumber 1.499950e+04 -4.998500e+03 10000.00 1.00
1 CustomerId 1.594029e+07 1.544147e+07 15815690.00 15565701.00
2 CreditScore 9.190000e+02 3.830000e+02 850.00 350.00
3 Age 6.200000e+01 1.400000e+01 92.00 18.00
4 Balance 3.191106e+05 -1.914664e+05 250898.09 0.00
5 EstimatedSalary 2.969675e+05 -9.657710e+04 199992.48 11.58
6 Point Earned 1.387500e+03 -1.765000e+02 1000.00 119.00

Conclusion
0 No Outlier
1 No Outlier
2 Outlier Present
3 Outlier Present
4 No Outlier
5 No Outlier
6 No Outlier

0.4 Logging Method

[56]: import os
import sys
import datetime
import logging

'''
This file configures logging method
'''

root_dir = "."
log_file_path = [Link](root_dir, 'logs')
[Link](log_file_path, exist_ok=True)

timeStamp = [Link]().strftime("%Y%m%d-%H%M%S")
date_of_script_run = [Link]().strftime("%d/%m/%y")
log_file_name = log_file_path + '/' + f'log_customer_segmentation_{timeStamp}'

def genLogger(log_file_name, gen_console_log=False, gen_file_log=True):

70
"""
This file creates logger
:param log_file_name:
:param gen_console_log:
:param gen_file_log:
:return:
"""
logger = [Link]()
[Link]([Link])
log_formatter = [Link]("(asctime)s [%(levelname)-5.5s]␣
↪%(message)s")

console_handler = [Link]([Link])
console_handler.setFormatter(log_formatter)

file_handler = [Link](f"{log_file_name}.log", mode="a")

file_handler.setFormatter(log_formatter)

if not [Link]():
if gen_console_log:
[Link](console_handler)
if gen_file_log:
[Link](file_handler)
return logger

def closeLogger(logger):
"""
This function closes an open handler
:param logger:
:return:
"""
for handler in list([Link]):
[Link]()
[Link](handler)

# logger = genLogger(log_file_name, gen_console_log=True, gen_file_log=True)

# closeLogger(logger)

Chart Final Class
No ratings yet
Chart Final Class
8 pages
Data Visualization Examples
No ratings yet
Data Visualization Examples
7 pages
Data Analyzer
No ratings yet
Data Analyzer
10 pages
The Goal of This Part Is To Use Descriptive Statistics and Visualization To Better Understand Your Data
No ratings yet
The Goal of This Part Is To Use Descriptive Statistics and Visualization To Better Understand Your Data
3 pages
Data Visualization for Analysts
No ratings yet
Data Visualization for Analysts
159 pages
Data Visualization
No ratings yet
Data Visualization
159 pages
Data Visualization
No ratings yet
Data Visualization
70 pages
Mastering Data Visualization Techniques 1728896857
No ratings yet
Mastering Data Visualization Techniques 1728896857
85 pages
Mastering Data Visualization Techniques (Part 1)
No ratings yet
Mastering Data Visualization Techniques (Part 1)
20 pages
Unit 6
No ratings yet
Unit 6
3 pages
Data Visualization Tools for EDA
No ratings yet
Data Visualization Tools for EDA
10 pages
EDA Cheatsheet - Class Note
No ratings yet
EDA Cheatsheet - Class Note
29 pages
EDA Cheatsheet - Class Note
No ratings yet
EDA Cheatsheet - Class Note
29 pages
EDA+Cheatsheet+ +Class+Note
No ratings yet
EDA+Cheatsheet+ +Class+Note
29 pages
EDA Code Cheatsheet for Data Analysis
No ratings yet
EDA Code Cheatsheet for Data Analysis
29 pages
6) Exploratory Data Analysis
No ratings yet
6) Exploratory Data Analysis
29 pages
EDA+Cheatsheet+ +Class+Note
No ratings yet
EDA+Cheatsheet+ +Class+Note
29 pages
Mayank Chaudhary DEV Practicals
No ratings yet
Mayank Chaudhary DEV Practicals
14 pages
Exploratory Data Analysis
No ratings yet
Exploratory Data Analysis
4 pages
Data Analysis with Python Scripts
No ratings yet
Data Analysis with Python Scripts
9 pages
Exploratory Data Analysis of Heart Disease Dataset 1737826105
No ratings yet
Exploratory Data Analysis of Heart Disease Dataset 1737826105
50 pages
EDA of Iris Dataset in Python
No ratings yet
EDA of Iris Dataset in Python
12 pages
Introduction To EDA: Exploratory Data Analysis (EDA) in Data Science
No ratings yet
Introduction To EDA: Exploratory Data Analysis (EDA) in Data Science
4 pages
EDA Cheat Sheet - Supercharge Your Data Analysis!
No ratings yet
EDA Cheat Sheet - Supercharge Your Data Analysis!
2 pages
Ad3301 Unit 1
No ratings yet
Ad3301 Unit 1
15 pages
Univariate Analysis in Machine Learning
No ratings yet
Univariate Analysis in Machine Learning
17 pages
EDA Step by Step
No ratings yet
EDA Step by Step
2 pages
Exp 2 SDK Ok
No ratings yet
Exp 2 SDK Ok
18 pages
Keeratsi HW8
No ratings yet
Keeratsi HW8
17 pages
Ai&Ml Bail606 ML Lab Manual
No ratings yet
Ai&Ml Bail606 ML Lab Manual
50 pages
Exploratory Data Analysis (EDA) in Python
No ratings yet
Exploratory Data Analysis (EDA) in Python
6 pages
ML Lab - Exp1-10
No ratings yet
ML Lab - Exp1-10
4 pages
Dsa 1
No ratings yet
Dsa 1
8 pages
Data Visualization
No ratings yet
Data Visualization
10 pages
Machine Learning
No ratings yet
Machine Learning
149 pages
DSBDAL - Assignment No 9
No ratings yet
DSBDAL - Assignment No 9
12 pages
Delhivery Data Processing Overview
No ratings yet
Delhivery Data Processing Overview
79 pages
Iris Dataset Feature Analysis
No ratings yet
Iris Dataset Feature Analysis
3 pages
Haberman Cancer Survival Analysis Guide
No ratings yet
Haberman Cancer Survival Analysis Guide
1 page
Ilovepdf Merged
No ratings yet
Ilovepdf Merged
89 pages
Data Science and Analtics Laboratory
No ratings yet
Data Science and Analtics Laboratory
21 pages
fdp.08.5.2024 (2prog)
No ratings yet
fdp.08.5.2024 (2prog)
6 pages
FDS All Practicals
No ratings yet
FDS All Practicals
10 pages
Fds Slips
No ratings yet
Fds Slips
6 pages
Advanced Plot Types With Seaborn
No ratings yet
Advanced Plot Types With Seaborn
8 pages
Data Analisis 2
No ratings yet
Data Analisis 2
13 pages
ML Labmanual
No ratings yet
ML Labmanual
33 pages
Lab Programs 1 To 5
No ratings yet
Lab Programs 1 To 5
12 pages
Machine
No ratings yet
Machine
10 pages
Batch1 Ds
No ratings yet
Batch1 Ds
15 pages
Aphical Representation
No ratings yet
Aphical Representation
12 pages
06 Seaborn
No ratings yet
06 Seaborn
13 pages
DV Lab Fat
No ratings yet
DV Lab Fat
7 pages
Student Alcohol Use Analysis
No ratings yet
Student Alcohol Use Analysis
20 pages
Lab 5 &6
No ratings yet
Lab 5 &6
6 pages
ML 5.0
No ratings yet
ML 5.0
2 pages
Time Projection Model - Nick Matthews
100% (1)
Time Projection Model - Nick Matthews
6 pages
Data Science Lab Manual for 7th Sem
No ratings yet
Data Science Lab Manual for 7th Sem
64 pages
Identifying and Formulating The Research Problem: October 2018
No ratings yet
Identifying and Formulating The Research Problem: October 2018
14 pages
Questionnaire Qualitative Research
No ratings yet
Questionnaire Qualitative Research
1 page
Admsci 12 00099 With Cover
No ratings yet
Admsci 12 00099 With Cover
18 pages
Student Vendor Preferences Study
100% (1)
Student Vendor Preferences Study
27 pages
Minika Bassey E-WPS Office
No ratings yet
Minika Bassey E-WPS Office
5 pages
Abstract For MCD
No ratings yet
Abstract For MCD
11 pages
Markov Analysis Details
No ratings yet
Markov Analysis Details
6 pages
Stuvia 5424414 Iop2601 Assignment 4 Complete Answers Due 27 May 2024 Semester 12024 Unisa
No ratings yet
Stuvia 5424414 Iop2601 Assignment 4 Complete Answers Due 27 May 2024 Semester 12024 Unisa
17 pages
Virtual University of Pakistan
No ratings yet
Virtual University of Pakistan
11 pages
MBA Proposal Defense Presentation
No ratings yet
MBA Proposal Defense Presentation
23 pages
Lecture 6
No ratings yet
Lecture 6
28 pages
The Effects of Broken Home
No ratings yet
The Effects of Broken Home
12 pages
Digital Transformation Challenges
No ratings yet
Digital Transformation Challenges
13 pages
Deep Fake Technology
No ratings yet
Deep Fake Technology
10 pages
Ocr History Coursework Help
100% (2)
Ocr History Coursework Help
5 pages
C-SEA College Inception Report
No ratings yet
C-SEA College Inception Report
9 pages
Machine Learning Interview Questions
No ratings yet
Machine Learning Interview Questions
20 pages
West African Cashew Market Trends
No ratings yet
West African Cashew Market Trends
16 pages
Fmed 10 1174631
No ratings yet
Fmed 10 1174631
7 pages
Sample Organizational Assessment Template PDF
100% (1)
Sample Organizational Assessment Template PDF
3 pages
Education Student Evaluation Report
No ratings yet
Education Student Evaluation Report
4 pages
Reinforcement Learning Overview
No ratings yet
Reinforcement Learning Overview
49 pages
AI's Role in Diagnosing Hospital Patients
No ratings yet
AI's Role in Diagnosing Hospital Patients
10 pages
Understanding Management Control Functions
No ratings yet
Understanding Management Control Functions
18 pages
Social Media and Political Awareness in Pakistan A Case Study of Youth
No ratings yet
Social Media and Political Awareness in Pakistan A Case Study of Youth
14 pages
Training Needs Analysis Template
No ratings yet
Training Needs Analysis Template
7 pages
A Sadiy Ah 23232023 A Jeb A 108749
No ratings yet
A Sadiy Ah 23232023 A Jeb A 108749
9 pages
MECH 215 - Instrumentation and Measurement Week 3, Lecture 3 Uncertainty Analysis
No ratings yet
MECH 215 - Instrumentation and Measurement Week 3, Lecture 3 Uncertainty Analysis
27 pages