Python Code - Summary Statistics
Python Code - Summary Statistics
SRB-30.073034
Problem 1:
import numpy as np
# Central tendency of the dataset: compute the arithmetic mean and the
# median (middle value) first, then report both.
mean = np.mean(data)
median = np.median(data)
print("Mean:", mean)
print("Median:", median)
Problem 2:
# Mode
# This snippet uses `stats` (and `np` below), so bring both into scope here
# rather than relying on imports made by other snippets.
import numpy as np
from scipy import stats

# stats.mode returns a result object; its `.mode` field holds the most
# frequent value in `data`.
mode = stats.mode(data)
# `.mode` is a one-element array in older SciPy releases and a plain scalar in
# newer ones, so normalise it to 1-D before taking the first element. Indexing
# a scalar with [0] would raise an error.
print("Mode:", np.atleast_1d(mode.mode)[0])
Problem 3:
import numpy as np
# Range: spread between the largest and the smallest observation.
range_value = np.max(data) - np.min(data)
print("Range:", range_value)
import numpy as np
# Sample variance and sample standard deviation.
# ddof=1 makes NumPy divide by (n - 1) instead of n.
variance = np.var(data, ddof=1)
std_dev = np.std(data, ddof=1)
print("Variance:", variance)
print("Standard Deviation:", std_dev)
Problem 5:
#Five-Number Summary
import numpy as np
# Five-number summary: minimum, first quartile, median, third quartile, maximum.
minimum, maximum = np.min(data), np.max(data)
q1 = np.percentile(data, 25)  # first quartile (25th percentile)
q3 = np.percentile(data, 75)  # third quartile (75th percentile)
median = np.median(data)
five_number_summary = [minimum, q1, median, q3, maximum]
print("Five-Number Summary:", five_number_summary)
Problem 7:
#Z-Score
import numpy as np
# Z-score of the value 45: its distance from the mean of `data`, expressed in
# units of the sample standard deviation (ddof=1 -> divisor n - 1).
mean = np.mean(data)
std_dev = np.std(data, ddof=1)
deviation = 45 - mean
z_score = deviation / std_dev
print("Z-Score for 45:", z_score)
Problem 8:
#Correlation
import numpy as np
# Paired observations.
X = [2, 4, 6, 8, 10]
Y = [1, 2, 3, 4, 5]
# np.corrcoef returns the correlation matrix of its inputs; the off-diagonal
# entry [0, 1] is the correlation coefficient between X and Y.
corr_matrix = np.corrcoef(X, Y)
correlation = corr_matrix[0, 1]
print("Correlation Coefficient:", correlation)
Problem 9:
#Covariance
import numpy as np
# Paired observations.
X = [1, 3, 5, 7, 9]
Y = [2, 4, 6, 8, 10]
# np.cov returns the covariance matrix of its inputs; the off-diagonal
# entry [0, 1] is the covariance between X and Y.
cov_matrix = np.cov(X, Y)
covariance = cov_matrix[0, 1]
print("Covariance:", covariance)
Problem 10:
#Normal Distribution
# Inputs for the normal-distribution problem: distribution mean, standard
# deviation, and the value of interest.
mean, std_dev, value = 170, 10, 180
import numpy as np
import matplotlib.pyplot as plt
import numpy as np
import matplotlib.pyplot as plt
# Histogram of `data` with dashed vertical markers at the mean and at one
# standard deviation on either side of it.
# NOTE(review): `mean` and `std_dev` are not computed in this snippet; they are
# whatever the preceding code assigned. Confirm they actually describe `data`.
plt.hist(data, bins=8, edgecolor='black', alpha=0.7)

# Line styling shared by all three markers.
dashed = {'linestyle': 'dashed', 'linewidth': 1}
plt.axvline(mean, color='r', label=f'Mean: {mean}', **dashed)
# Only the upper marker carries a legend entry; the lower one just shares its colour.
plt.axvline(mean + std_dev, color='g', label=f'Standard Deviation: {std_dev}', **dashed)
plt.axvline(mean - std_dev, color='g', **dashed)

plt.legend()
plt.title("Histogram of the Dataset with Mean and Standard Deviation")
plt.xlabel("Value")
plt.ylabel("Frequency")
plt.show()
Problem 7: Z-Score
import numpy as np
import matplotlib.pyplot as plt
import scipy.stats as stats
data = [30, 35, 40, 45, 50, 55, 60]
# The z-score must be measured against this dataset's own statistics, so compute
# them here. Otherwise `mean` / `std_dev` are either undefined or left over from
# earlier code (e.g. the 170 / 10 used for the normal-distribution problem).
mean = np.mean(data)
std_dev = np.std(data, ddof=1)  # sample standard deviation (divisor n - 1)
# Z-Score for 45
z_score = (45 - mean) / std_dev
Problem 8: Correlation
import numpy as np
import matplotlib.pyplot as plt
# Paired observations.
X = [2, 4, 6, 8, 10]
Y = [1, 2, 3, 4, 5]
# Off-diagonal entry of the correlation matrix is the X-Y correlation coefficient.
corr_matrix = np.corrcoef(X, Y)
correlation = corr_matrix[0, 1]

# Scatter plot of Y against X, with the coefficient (two decimals) in the title.
plot_title = f"Scatter Plot of X and Y (Correlation: {correlation:.2f})"
plt.scatter(X, Y)
plt.title(plot_title)
plt.xlabel("X")
plt.ylabel("Y")
plt.show()
Extra 1:
import numpy as np
import matplotlib.pyplot as plt
# Example data
X = [2, 4, 6, 8, 10]
Y = [1, 2, 3, 4, 5]
# The plot title reports the correlation, so compute it from this snippet's own
# X and Y instead of depending on a `correlation` value left over from earlier code.
correlation = np.corrcoef(X, Y)[0, 1]
# Scatter plot
plt.scatter(X, Y)
plt.title(f"Scatter Plot of X and Y (Correlation: {correlation:.2f})")
plt.xlabel("X")
plt.ylabel("Y")
plt.show()
Extra 2:
import numpy as np
from sklearn.preprocessing import StandardScaler
# Example dataset: five samples of a single feature, as a column (shape 5x1).
data = np.array([[70], [75], [80], [85], [90]])
# Standardization: fit the scaler on the data, then transform that same data.
scaler = StandardScaler()
scaler.fit(data)
standardized_data = scaler.transform(data)
Extra 3:
import numpy as np
# Example data
X = [1, 2, 3, 4, 5]
Y = [2, 4, 6, 8, 10]