import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
# Load cleaned data
df = pd.read_csv("cleaned_heart_data.csv")
df.head()2. Exploratory Data Analysis (EDA)
Target Distribution
sns.countplot(x='target', data=df)
plt.title("Target Class Distribution")
plt.xlabel("Heart Disease (0 = No, 1 = Yes)")
plt.ylabel("Count")
plt.show()Correlation Heatmap
plt.figure(figsize=(12, 10))
sns.heatmap(df.corr(), annot=True, fmt=".2f", cmap="coolwarm")
plt.title("Correlation Heatmap")
plt.show()Numerical Feature Distributions
num_cols = ['age', 'trestbps', 'chol', 'thalach', 'oldpeak']
df[num_cols].hist(bins=20, figsize=(14, 10))
plt.tight_layout()
plt.show()Pair Plot by Target
sns.pairplot(df[['age', 'chol', 'thalach', 'oldpeak', 'target']], hue='target')
plt.show()