22011P0515 ML Assignment
22011P0515 ML Assignment
Computations: mean, median, and mode
def calculate_mean(data):
    """Return the arithmetic mean of ``data``.

    Args:
        data: A non-empty iterable of numbers. One-shot iterators such as
            generators are accepted and are consumed.

    Returns:
        The sum of the values divided by the number of values.

    Raises:
        ZeroDivisionError: If ``data`` is empty.
    """
    # Inputs without len() (e.g. generators) are materialised once so the
    # values can be both summed and counted.
    values = data if hasattr(data, "__len__") else list(data)
    return sum(values) / len(values)
def calculate_median(data):
    """Return the median of ``data``.

    The input is not modified; a sorted copy is used.

    Args:
        data: A non-empty iterable of mutually comparable values.

    Returns:
        The middle value when the number of values is odd, otherwise the
        average of the two middle values.

    Raises:
        IndexError: If ``data`` is empty.
    """
    ordered = sorted(data)
    mid, is_odd = divmod(len(ordered), 2)
    if is_odd:
        return ordered[mid]
    # Even count: average the two values that straddle the centre.
    return (ordered[mid - 1] + ordered[mid]) / 2
def calculate_mode(data):
    """Return every value that occurs most often in ``data``.

    Args:
        data: An iterable of hashable values.

    Returns:
        A list of the most frequent values, in the order they first appear
        in ``data``. The list has more than one element when several values
        tie for the highest count, and is empty when ``data`` is empty.
    """
    from collections import Counter

    counts = Counter(data)
    if not counts:
        # No values means no modes; avoids max() failing on an empty sequence.
        return []
    highest = max(counts.values())
    return [value for value, count in counts.items() if count == highest]
# Compute and print the mean, median and mode of a numeric sample.
# NOTE(review): no numeric dataset is defined above this point in the file,
# so `data` would be undefined here. The values below are placeholder sample
# data -- substitute the intended dataset.
data = [4, 8, 6, 5, 3, 8, 9, 8]
mean = calculate_mean(data)
median = calculate_median(data)
mode = calculate_mode(data)
print(f"Mean: {mean}")
print(f"Median: {median}")
print(f"Mode: {mode}")
Output:
import pandas as pd
# Read 'enjoy_sport.csv' (path relative to the current working directory)
# into a pandas DataFrame and print it.
# NOTE(review): `df` is not referenced again in the visible code; the Find-S
# run below uses a hard-coded `data` list instead -- confirm whether the CSV
# was meant to feed find_s.
df = pd.read_csv('enjoy_sport.csv')
print(df)
def find_s(data):
    """Run the Find-S algorithm and return the learned hypothesis.

    The hypothesis starts as the attribute values of the first positive
    example and is generalised by every later positive example: any
    attribute whose value disagrees is replaced with ``'?'`` (any value is
    acceptable). Negative examples are ignored.

    Args:
        data: An iterable of training examples. Each example is a sequence
            whose last element is the class label (``'Yes'`` marks a
            positive example) and whose other elements are the attribute
            values. The examples are not modified.

    Returns:
        A list with one entry per attribute: the shared attribute value, or
        ``'?'`` where positive examples disagree. When there is no positive
        example the most specific hypothesis is returned, written as
        ``'0'`` (no value is acceptable) for every attribute; for empty
        ``data`` this is an empty list.
    """
    hypothesis = None
    n_attributes = 0
    for instance in data:
        attributes, label = instance[:-1], instance[-1]
        n_attributes = len(attributes)
        if label != 'Yes':
            continue
        if hypothesis is None:
            # Seed from the first *positive* example; seeding from a negative
            # first row would generalise from the wrong values.
            hypothesis = list(attributes)
            continue
        for i, (current, observed) in enumerate(zip(hypothesis, attributes)):
            if current != observed:
                hypothesis[i] = '?'
    if hypothesis is None:
        return ['0'] * n_attributes
    return hypothesis
# Training examples for find_s: each row holds the attribute values followed
# by the class label ('Yes' or 'No') in the last position.
data = [
    ['Sunny', 'Warm', 'Normal', 'Strong', 'Yes'],
    ['Sunny', 'Warm', 'High', 'Strong', 'Yes'],
    ['Rainy', 'Cold', 'High', 'Strong', 'No'],
    ['Sunny', 'Warm', 'High', 'Weak', 'Yes'],
]

# Learn the hypothesis from the examples above and report it.
result = find_s(data)
print("Final Hypothesis:", result)
Output: