Time Series Analysis Group 9
Time Series Analysis Group 9
import pandas as pd
import matplotlib.pyplot as plt

# Build one year of daily sample data.
# NOTE(review): the listing lost its 'date' column even though the code below
# indexes by it; the start date here is a placeholder -- confirm the intended
# date range.
data = {
    'date': pd.date_range(start='2023-01-01', periods=365, freq='D'),
    'value': [i**2 for i in range(365)],  # Sample data: squares of numbers from 0 to 364
}
# Create DataFrame
df = pd.DataFrame(data)
df['date'] = pd.to_datetime(df['date'])
# Index by date so the summary and the plot work on the value column only.
df.set_index('date', inplace=True)
print("----------------------------")
print("Data Summary:")
print(df.describe())
plt.figure(figsize=(10, 6))
# Draw the series with a label; without a labelled artist plt.legend() has
# nothing to display.
plt.plot(df.index, df['value'], label='Value')
plt.ylabel('Value')
plt.legend()
plt.grid(True)
plt.show()
OUTPUT:
import pandas as pd
# Sample records; the values are taken from the recorded "Original DataFrame"
# output that accompanies this listing.
data = {
    'Name': ['John', 'Anna', 'Peter', 'Linda', 'Sophia'],
    'Age': [25, 24, 26, 23, 27],
    'Grade': ['A', 'B', 'A', 'B', 'A'],
}
df = pd.DataFrame(data)
print("Original DataFrame:")
print(df)
# Selecting single columns
print(df['Name'])
print(df['Age'])
# Filtering data
print("\nFiltering data:")
# NOTE(review): the filter expression is missing from the listing. The recorded
# output keeps rows 0, 2 and 4, which is consistent with Grade == 'A' (and
# equally with Age > 24) -- confirm which condition was intended.
filtered_df = df[df['Grade'] == 'A']
print(filtered_df)
# Deleting a column
df.drop(columns=['Grade'], inplace=True)
print(df)
OUTPUT:
Original DataFrame:
Name Age Grade
0 John 25 A
1 Anna 24 B
2 Peter 26 A
3 Linda 23 B
4 Sophia 27 A
Filtering data:
Name Age Grade
0 John 25 A
2 Peter 26 A
4 Sophia 27 A
import matplotlib.pyplot as plt

# Sample data
x = [1, 2, 3, 4, 5]
y1 = [2, 3, 5, 7, 11]

# NOTE(review): the drawing calls were missing from this listing, so every
# figure was empty and plt.legend() had no labelled artist. The calls below
# restore one labelled artist per figure -- confirm against the original
# exercise.

# Line plot
plt.figure(figsize=(8, 4))
plt.plot(x, y1, label='y1')
plt.title('Line Plot')
plt.xlabel('X-axis')
plt.ylabel('Y-axis')
plt.legend()
plt.grid(True)
plt.show()

# Second figure
# NOTE(review): this figure has no title in the listing; a scatter plot is
# assumed here -- confirm the intended plot type.
plt.figure(figsize=(8, 4))
plt.scatter(x, y1, label='y1')
plt.xlabel('X-axis')
plt.ylabel('Y-axis')
plt.legend()
plt.grid(True)
plt.show()

# Bar plot
plt.figure(figsize=(8, 4))
plt.bar(x, y1, label='y1')
plt.title('Bar Plot')
plt.xlabel('X-axis')
plt.ylabel('Y-axis')
plt.legend()
plt.grid(True)
plt.show()
OUTPUT:
Frequency distributions, Averages, Variability
import numpy as np
# Sample data
data = [12, 15, 18, 20, 22, 25, 28, 30, 32, 35, 38, 40, 42, 45, 48]


# Frequency distribution
def frequency_distribution(data):
    """Count how many times each distinct item occurs in *data*.

    Args:
        data: Iterable of hashable items.

    Returns:
        A dict mapping each distinct item to its number of occurrences,
        with keys in order of first appearance.
    """
    freq_dict = {}
    for item in data:
        # dict.get supplies 0 the first time an item is seen.
        freq_dict[item] = freq_dict.get(item, 0) + 1
    return freq_dict


freq_dict = frequency_distribution(data)
print("Frequency Distribution:")
for key, value in freq_dict.items():
    print(f"{key}: {value}")
OUTPUT:
Frequency Distribution:
12: 1
15: 1
18: 1
20: 1
22: 1
25: 1
28: 1
30: 1
32: 1
35: 1
38: 1
40: 1
42: 1
45: 1
48: 1
Measures of Variability:
Range: 36
Variance: 118.13333333333334
Standard Deviation: 10.868915922636136
Normal Curves, Correlation and scatter plots, Correlation coefficient
import numpy as np
import matplotlib.pyplot as plt
from scipy.stats import norm
# Scatter plot
# NOTE(review): x and y are not defined in this listing; they must already
# exist when this runs -- confirm where the sample data is created.
plt.figure(figsize=(8, 6))
plt.scatter(x, y, color='blue')
plt.title('Scatter Plot')
plt.xlabel('X')
plt.ylabel('Y')
plt.grid(True)
plt.show()
# Correlation coefficient
# For two 1-D inputs np.corrcoef returns a 2x2 matrix; entry [0, 1] is the
# coefficient between x and y (assumes x and y are 1-D -- TODO confirm).
correlation_coefficient = np.corrcoef(x, y)[0, 1]
print("Correlation Coefficient:", correlation_coefficient)
# Normal curves
# NOTE(review): no curve is drawn and no new figure is opened before the calls
# below in this listing, although scipy.stats.norm is imported above; the
# plotting statements appear to be missing -- confirm against the original.
plt.title('Normal Curves')
plt.xlabel('Value')
plt.ylabel('Density')
plt.legend()
plt.grid(True)
plt.show()
OUTPUT:
Regression python program
import numpy as np
import matplotlib.pyplot as plt
from sklearn.linear_model import LinearRegression
# Sample data
x = np.array([1, 2, 3, 4, 5, 6, 7, 8, 9, 10]).reshape(-1, 1) # Reshape for single feature
y = np.array([2, 3, 5, 7, 11, 13, 17, 19, 23, 29])
# Create and fit the model. This step was missing from the listing, which left
# `model` undefined when predict() and the coefficient prints ran.
model = LinearRegression()
model.fit(x, y)
# Make predictions
y_pred = model.predict(x)
# Coefficients
print("Intercept:", model.intercept_)
print("Slope:", model.coef_[0])
OUTPUT:
Building and validating linear models
import numpy as np
from sklearn.model_selection import train_test_split
from sklearn.linear_model import LinearRegression
from sklearn.metrics import mean_squared_error, r2_score
OUTPUT:
Mean Squared Error (MSE): 0.22943831174285717
Coefficient of Determination (R^2): 0.559376074296551
# Print each evaluation result under its heading, in a fixed order.
# NOTE(review): accuracy, conf_matrix and class_report are not defined in this
# listing; they must be computed before this point -- confirm.
report_sections = (
    ("Accuracy:", accuracy),
    ("Confusion Matrix:\n", conf_matrix),
    ("Classification Report:\n", class_report),
)
for heading, payload in report_sections:
    print(heading, payload)
OUTPUT:
Accuracy: 1.0
Confusion Matrix:
[[13 0]
[ 0 7]]
Classification Report:
precision recall f1-score support
accuracy 1.00 20
macro avg 1.00 1.00 1.00 20
weighted avg 1.00 1.00 1.00 20