2
import pandas as pd import numpy as np import seaborn as sns import matplotlib.pyplot as plt from sklearn.datasets import fetch_california_housing # Load dataset and convert to DataFrame data = fetch_california_housing() df = pd.DataFrame(data.data, columns=data.feature_names) df['MedHouseVal'] = data.target # Add target column # 1. Correlation Matrix correlation_matrix = df.corr() print("\nCorrelation Matrix:") print(correlation_matrix) # 2. Heatmap of Correlation Matrix plt.figure(figsize=(10, 8)) sns.heatmap(correlation_matrix, annot=True, cmap='coolwarm', fmt='.2f', linewidths=0.5) plt.title('Correlation Matrix of California Housing Features') plt.tight_layout() plt.show() # 3. Pair Plot for Selected Features selected_features = ['MedInc', 'HouseAge', 'AveRooms', 'AveOccup', 'MedHouseVal'] sns.pairplot(df[selected_features], diag_kind='kde', plot_kws={'alpha': 0.5}) plt.suptitle('Pair Plot of Selected California Housing Features', y=1.02) plt.tight_layout() plt.show()
Comments
Post a Comment