VND - Openxmlformats Officedocument - Wordprocessingml.document&rendition 1
VND - Openxmlformats Officedocument - Wordprocessingml.document&rendition 1
AIM:
To write a Python program to import and export data using the Pandas library
functions.
PROCEDURE:
PROGRAM
import pandas as pd

# Input and output locations for the round trip.
source_path = 'student_data.csv'
export_path = 'student_data_exported.csv'

# Import: read the CSV file into a DataFrame.
df = pd.read_csv(source_path)

# Show the heading and the loaded table, one per line.
print("Imported Data:", df, sep="\n")

# Export: write the table to a new CSV file without the row-index column.
df.to_csv(export_path, index=False)
AIM
PROCEDURE
PROGRAM
import pandas as pd
data = {
df = pd.DataFrame(data)
# Impute missing values by assigning the filled column back to the frame.
# fillna(..., inplace=True) called on df['col'] acts on an intermediate
# object: pandas 2.x raises a FutureWarning for that pattern and, with
# Copy-on-Write enabled, df itself would be left unchanged.
df['Age'] = df['Age'].fillna(df['Age'].mean())  # mean of the column
df['Salary'] = df['Salary'].fillna(df['Salary'].median())  # median of the column
le = LabelEncoder()
df = df.drop_duplicates()
scaler = StandardScaler()
AIM
PROCEDURE
PROGRAM
import pandas as pd
data = {
df = pd.DataFrame(data)
y = df['Rent (Rs)']
model = LinearRegression()
model.fit(X_train, y_train)
y_pred = model.predict(X_test)
AIM
PROCEDURE
PROGRAM
# Step 1: Load the dataset and pull out its data, target and target_names.
# NOTE(review): load_iris and KNeighborsClassifier are not imported anywhere
# in this excerpt — presumably they come from scikit-learn; confirm.
iris = load_iris()
X = iris.data
y = iris.target
target_names = iris.target_names
# Step 2: Split into train and test
# NOTE(review): no statement in this excerpt assigns X_train, X_test,
# y_train or y_test, so the split itself appears to be missing here.
# Step 3: Build the classifier with k neighbours and fit it.
k=3
knn = KNeighborsClassifier(n_neighbors=k)
knn.fit(X_train, y_train)
# Step 4: Predict
y_pred = knn.predict(X_test)
for i in range(len(y_test)):
actual = target_names[y_test[i]]
predicted = target_names[y_pred[i]]
if y_test[i] == y_pred[i]:
else:
AIM
PROCEDURE
PROGRAM
iris = load_iris()
X = iris.data
y = iris.target
target_names = iris.target_names
clf = DecisionTreeClassifier(random_state=42)
clf.fit(X_train, y_train)
y_pred = clf.predict(X_test)
prediction = clf.predict(new_sample)
AIM
PROCEDURE
PROGRAM
iris = load_iris()
X = iris.data
y = iris.target
target_names = iris.target_names
# Step 2: Split dataset
model = GaussianNB()
model.fit(X_train, y_train)
y_pred = model.predict(X_test)
print("\nClassification Report:")
AIM:
PROCEDURE:
PROGRAM
iris = load_iris()
X = iris.data
y = iris.target
target_names = iris.target_names
model.fit(X_train, y_train)
y_pred = model.predict(X_test)
print("\nClassification Report:")
AIM
PROCEDURE
PROGRAM
import pandas as pd

# Location of the heart dataset CSV on the raw GitHub host.  The address must
# be one unbroken string literal; adjacent literals inside the parentheses
# are concatenated, which keeps each source line short.
url = (
    "https://raw.githubusercontent.com/omairaasim/"
    "machine-learning-datasets/main/heart.csv"
)

# Download the CSV and parse it into a DataFrame.
df = pd.read_csv(url)
scaler = StandardScaler()
X_scaled = scaler.fit_transform(X)
model.fit(X_train, y_train)
# Step 6: Predict
y_pred = model.predict(X_test)
AIM
PROCEDURE
PROGRAM
import pandas as pd

# Location of the heart dataset CSV on the raw GitHub host.  The address must
# be one unbroken string literal; adjacent literals inside the parentheses
# are concatenated, which keeps each source line short.
url = (
    "https://raw.githubusercontent.com/omairaasim/"
    "machine-learning-datasets/main/heart.csv"
)

# Download the CSV and parse it into a DataFrame.
df = pd.read_csv(url)
# Features are every column except 'target'; the label is the 'target' column.
X = df.drop('target', axis=1)
y = df['target']
# Fit a scaler on the features and keep the transformed copy.
# NOTE(review): StandardScaler and RandomForestClassifier are not imported in
# this excerpt — presumably from scikit-learn; confirm.
scaler = StandardScaler()
X_scaled = scaler.fit_transform(X)
# NOTE(review): nothing visible here uses X_scaled or assigns X_train,
# X_test or y_train; the train/test split appears to be missing from this
# excerpt.
# Train a forest of 100 trees with a fixed random_state, then predict.
rf = RandomForestClassifier(n_estimators=100, random_state=42)
rf.fit(X_train, y_train)
y_pred = rf.predict(X_test)
AIM
PROCEDURE
PROGRAM
X = iris.data
y = iris.target
model.fit(X_train, y_train)
y_pred = model.predict(X_test)
AIM
To implement the K-Means clustering algorithm on a dataset and visualize the clusters.
PROCEDURE
PROGRAM
import numpy as np
kmeans.fit(X)
y_kmeans = kmeans.predict(X)
centers = kmeans.cluster_centers_
plt.title("K-Means Clustering")
plt.xlabel("Feature 1")
plt.ylabel("Feature 2")
plt.grid(True)
plt.show()
AIM
PROCEDURE
PROGRAM
import numpy as np
# Load the dataset and pull out its data, target and target_names.
# NOTE(review): load_iris, StandardScaler, PCA and plt are not imported in
# this excerpt — presumably scikit-learn and matplotlib.pyplot; confirm.
data = load_iris()
X = data.data
y = data.target
target_names = data.target_names
# Scale the features first, then run PCA on the scaled values.
scaler = StandardScaler()
X_scaled = scaler.fit_transform(X)
# Reduce the scaled features to two components.
pca = PCA(n_components=2)
X_pca = pca.fit_transform(X_scaled)
# Open an 8x6 figure for the projection.
# NOTE(review): no plotting call appears between figure() and legend() in
# this excerpt, so X_pca, y and target_names are never drawn here — the
# scatter step appears to be missing.
plt.figure(figsize=(8, 6))
plt.legend()
plt.grid(True)
plt.show()