from google.colab import drive
drive.mount('/content/drive')

Mounted at /content/drive

import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

from sklearn.model_selection import train_test_split

# Load the dataset
whr_df = pd.read_csv('/content/drive/MyDrive/WHR_2023.csv')

# Inspect the first few rows to understand the structure
whr_df

# Convert the regression target ('happiness_score') into classification labels
# We'll use quartiles to create 4 happiness categories: Very Low, Low, High, Very High

# Define quartiles
whr_df['happiness_category'] = pd.qcut(whr_df['happiness_score'],
                                       q=5,
                                       labels=['Very Low', 'Low','Average', 'High', 'Very High'])

# Select features and target
X = whr_df.drop(columns=['happiness_score', 'happiness_category'])
y = whr_df['happiness_category']

# Split into train and test sets
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.3, random_state=42, stratify=y)

# Convert y_train and y_test to numerical labels
y_train_labels = y_train.astype('category').cat.codes
y_test_labels = y_test.astype('category').cat.codes

# Truncated and cleaned up region data to merge
countrydata=pd.read_csv("/content/drive/MyDrive/newcountryvars.csv")

countrydata.head()

# Merge in new data to X_train and X_test by taking "country" from first table and "country_name" from 2nd table.
# Also check which countries are common in both the datasets, and which type of merge will you perform for the best results.
# Hint: Look on the 'how' parameter of megre function of pandas.

# for our use case, we used the left join to do the merging, this is because we do not lose any of our original data. furthermore,
# countries missing from the country data just get missing values for new features introduced at merge. we deduplicate to remove the redundant
# columns introduced by the merge,

X_train = X_train.merge(countrydata,
                        left_on='country',
                        right_on='country_name',
                        how='left')

X_test = X_test.merge(countrydata,
                      left_on='country',
                      right_on='country_name',
                      how='left')

DUPLICATE_COLS = [
    'country_name',
    'region_y',
    'gdp_per_capita_y',
    'social_support_y',
    'healthy_life_expectancy_y',
    'freedom_to_make_life_choices_y',
    'generosity_y',
    'perceptions_of_corruption_y',
    'happiness_score_y',
    'happiness_category_y',
]

X_train = X_train.drop(columns=[c for c in DUPLICATE_COLS if c in X_train.columns])
X_test  = X_test.drop(columns=[c for c in DUPLICATE_COLS if c in X_test.columns])

RENAME_MAP = {
    'region_x':                       'region',
    'gdp_per_capita_x':               'gdp_per_capita',
    'social_support_x':               'social_support',
    'healthy_life_expectancy_x':      'healthy_life_expectancy',
    'freedom_to_make_life_choices_x': 'freedom_to_make_life_choices',
    'generosity_x':                   'generosity',
    'perceptions_of_corruption_x':    'perceptions_of_corruption',
    'happiness_score_x':              'happiness_score',
    'happiness_category_x':           'happiness_category',
}

X_train = X_train.rename(columns={k: v for k, v in RENAME_MAP.items()
                                   if k in X_train.columns})
X_test  = X_test.rename(columns={k: v for k, v in RENAME_MAP.items()
                                   if k in X_test.columns})

print("X_train shape:", X_train.shape)
print("X_test  shape:", X_test.shape)

X_train shape: (95, 15)
X_test  shape: (42, 15)

X_train.head(150)

print(X_train.dtypes)

country                           object
region                            object
gdp_per_capita                   float64
social_support                   float64
healthy_life_expectancy          float64
freedom_to_make_life_choices     float64
generosity                       float64
perceptions_of_corruption        float64
population                       float64
population_below_poverty_line    float64
hdi                              float64
life_expectancy                  float64
expected_years_of_schooling      float64
mean_years_of_schooling          float64
gni                              float64
dtype: object

# Your code here: TODO
# update - consider merged, we have tons of missing values for the newcountrys
missing = X_train.isnull().sum()
missing_percent = 100 * missing / len(X_train)
missing_table = pd.concat([missing, missing_percent], axis=1)
missing_table

print(missing_percent)
# print(missing_table)

missing_df = pd.DataFrame({
    'Missing Values': missing,
    'Percentage (%)': missing_percent
}).sort_values(by='Missing Values', ascending=False)
print("Missing Values Summary Train Set:")
display(missing_df[missing_df['Missing Values'] > 0])

missing_test = X_test.isnull().sum()
missing_percent_test = 100 * missing_test / len(X_test)
missing_table = pd.concat([missing_test, missing_percent_test], axis=1)
missing_table
#print(missing_percent_test)
missing_df2 = pd.DataFrame({
    'Missing Values': missing_test,
    'Percentage (%)': missing_percent_test
}).sort_values(by='Missing Values', ascending=False)
print("Missing Values Summary Test Set:")
display(missing_df2[missing_df2['Missing Values'] > 0])

country                           0.000000
region                            0.000000
gdp_per_capita                    0.000000
social_support                    0.000000
healthy_life_expectancy           0.000000
freedom_to_make_life_choices      0.000000
generosity                        0.000000
perceptions_of_corruption         0.000000
population                        6.315789
population_below_poverty_line    16.842105
hdi                               6.315789
life_expectancy                   7.368421
expected_years_of_schooling       7.368421
mean_years_of_schooling           7.368421
gni                               7.368421
dtype: float64
Missing Values Summary Train Set:

Missing Values Summary Test Set:

# Your plotting code here: TODO
# key numerical values ---gdp_per_capita	social_support	healthy_life_expectancy
# freedom_to_make_life_choices	generosity	perceptions_of_corruption
#population_x, population_y	population_below_poverty_line_y	hdi_y	life_expectancy_y
# going with features that influence the levels of happiness

num_cols = X_train.select_dtypes(include=['float64', 'int64']).columns.tolist()
key_features = [c for c in num_cols if c in [
    'gdp_per_capita',
    'social_support',
    'healthy_life_expectancy',
    'freedom_to_make_life_choices',
    'generosity',
    'perceptions_of_corruption'
]][:6]

if not key_features:
    key_features = num_cols[:6]

# Histograms
fig, axes = plt.subplots(3, 2, figsize=(12, 8))
axes = axes.flatten()
for i, col in enumerate(key_features):
    if i < len(axes):
        axes[i].hist(X_train[col].dropna(), bins=20, edgecolor='black', alpha=0.7)
        axes[i].set_title(col)
        axes[i].set_xlabel(col)
plt.tight_layout()
plt.suptitle('Distribution of Key Numerical Features (Training Set)', y=1.02)
plt.show()

# Your plotting code(s) here: TODO
import matplotlib.pyplot as plt
import seaborn as sns
import pandas as pd
from IPython.display import display

fig, axes = plt.subplots(1, 2, figsize=(18, 5))
category_order = ['Very Low', 'Low', 'Average', 'High', 'Very High']
label_counts   = y_train.value_counts().reindex(category_order, fill_value=0)
total          = label_counts.sum()
bars = axes[1].bar(
    label_counts.index,
    label_counts.values,
    color=sns.color_palette('RdYlGn', len(category_order)),
    edgecolor='black',
    linewidth=0.8,
)

for bar, count in zip(bars, label_counts.values):
   pct = 100 * count / total
   axes[1].text(
        bar.get_x() + bar.get_width() / 2,
        bar.get_height() + 0.2,
        f'{count}\n({pct:.1f}%)',
        ha='center', va='bottom', fontsize=9,
    )

axes[1].set_title('Target Class Distribution\n(Happiness Category — Training Set)',
                  fontsize=12, fontweight='bold')
axes[1].set_xlabel('Happiness Category', fontsize=10)
axes[1].set_ylabel('Number of Countries', fontsize=10)
axes[1].set_ylim(0, label_counts.max() + 5)


region_counts = X_train['region'].value_counts().sort_values(ascending=True)

axes[0].barh(
    region_counts.index,
    region_counts.values,
    color=sns.color_palette('Set2', len(region_counts)),
    edgecolor='black',
    linewidth=0.8,
)

# Annotate with count so exact numbers are readable without gridlines
for idx, count in enumerate(region_counts.values):
    axes[0].text(count + 0.1, idx, str(count), va='center', fontsize=9)

axes[0].set_title('Geographic Distribution\n(Region — Training Set)',
                  fontsize=12, fontweight='bold')
axes[0].set_xlabel('Number of Countries', fontsize=10)
axes[0].set_xlim(0, region_counts.max() + 4)

(0.0, 27.0)

# Your code here: TODO
import matplotlib.pyplot as plt
import seaborn as sns
import pandas as pd
import numpy as np

num_cols = X_train.select_dtypes(include=['float64', 'int64']).columns.tolist()
num_df = X_train[num_cols].dropna()

pearson_correlation = num_df.corr(method='pearson')
spearman_correlation = num_df.corr(method='spearman')
kendall_correlation = num_df.corr(method='kendall')

fig, axes = plt.subplots(1, 3, figsize=(36, 8))

for i, corr_df in enumerate([pearson_correlation, spearman_correlation, kendall_correlation]):
    sns.heatmap(corr_df, annot=True, cmap='coolwarm', ax=axes[i])
    axes[i].set_title(f'Correlation Matrix - {["Pearson", "Spearman", "Kendall"][i]}', fontsize=
                      12, fontweight='bold')

plt.tight_layout()
plt.show()

# Print top correlations (Spearman — most reliable for this dataset since most features are skewed)
print("Top 10 Spearman correlations (excluding self-correlations):")
spearman_pairs = (
    spearman_correlation.where(~np.eye(len(spearman_correlation), dtype=bool))
    .stack()
    .abs()
    .sort_values(ascending=False)
)
print(spearman_pairs.head(10).to_string())

Top 10 Spearman correlations (excluding self-correlations):
hdi                          gni                            0.972306
gni                          hdi                            0.972306
life_expectancy              healthy_life_expectancy        0.958141
healthy_life_expectancy      life_expectancy                0.958141
expected_years_of_schooling  hdi                            0.953793
hdi                          expected_years_of_schooling    0.953793
gdp_per_capita               gni                            0.953552
gni                          gdp_per_capita                 0.953552
hdi                          gdp_per_capita                 0.940337
gdp_per_capita               hdi                            0.940337

# Bivariate Analysis and Relationship Exploration
import matplotlib.pyplot as plt
import seaborn as sns
import pandas as pd
import numpy as np

temp = X_train.copy()
temp['happiness_category'] = y_train
category = ['Very Low', 'Low', 'Average', 'High', 'Very High']

key_features = [c for c in num_cols if c in [
    'gdp_per_capita', 'social_support', 'healthy_life_expectancy',
    'freedom_to_make_life_choices', 'generosity', 'perceptions_of_corruption',
    'hdi', 'life_expectancy', 'population_below_poverty_line', 'population'
]][:9]

# Correlation table and heatmap
corr_df = temp[key_features + ['happiness_category']].copy()
# encode target for correlation
target_numeric = pd.Categorical(corr_df['happiness_category'], categories=category, ordered=True).codes
corr_df = corr_df[key_features].assign(happiness_category=target_numeric)
corr = corr_df.corr()

fig, ax = plt.subplots(figsize=(12, 10))
sns.heatmap(corr, annot=True, fmt='.2f', cmap='RdBu_r', center=0, square=True, linewidths=0.5, ax=ax)
ax.set_title('Correlation Table (Key Features + Target)', fontsize=14, fontweight='bold')
plt.tight_layout()
plt.show()

print("Correlation with target (happiness_category):")
print(corr['happiness_category'].drop('happiness_category').sort_values(ascending=False).round(3).to_string())

# Box plots: feature distributions across target classes
fig, axes = plt.subplots(3, 3, figsize=(18, 15))
axes = axes.flatten()
for i, col in enumerate(key_features):
    sns.boxplot(data=temp, x='happiness_category', y=col, order=category, palette='RdYlGn', ax=axes[i])
    axes[i].set_title(f'{col} by Happiness Category', fontsize=12, fontweight='bold')
    axes[i].set_xlabel('Happiness Category')
    axes[i].tick_params(axis='x', rotation=45)
for j in range(len(key_features), len(axes)):
    fig.delaxes(axes[j])
plt.suptitle('Bivariate Analysis: Box Plots (Feature vs Target)', fontsize=16, fontweight='bold', y=1.02)
plt.tight_layout()
plt.show()

# Scatter/strip: feature vs target
fig, axes = plt.subplots(3, 3, figsize=(18, 15))
axes = axes.flatten()
for i, col in enumerate(key_features):
    sns.stripplot(data=temp, x='happiness_category', y=col, order=category, palette='RdYlGn', jitter=0.25, size=6, alpha=0.6, ax=axes[i], edgecolor='black', linewidth=0.5)
    axes[i].set_title(f'{col} vs Happiness Category', fontsize=12, fontweight='bold')
    axes[i].set_xlabel('Happiness Category')
    axes[i].tick_params(axis='x', rotation=45)
for j in range(len(key_features), len(axes)):
    fig.delaxes(axes[j])
plt.suptitle('Bivariate Analysis: Scatter Distribution of Key Features', fontsize=16, fontweight='bold', y=1.02)
plt.tight_layout()
plt.show()

# Distribution comparison: KDE by target for key features
fig, axes = plt.subplots(3, 3, figsize=(18, 15))
axes = axes.flatten()
for i, col in enumerate(key_features):
    for cat in category:
        subset = temp.loc[temp['happiness_category'] == cat, col].dropna()
        axes[i].hist(subset, bins=15, alpha=0.5, label=cat, density=True)
    axes[i].set_title(f'{col} by Happiness Category', fontsize=12, fontweight='bold')
    axes[i].set_xlabel(col)
    axes[i].set_ylabel('Density')
    axes[i].legend(loc='upper right', fontsize=8)
for j in range(len(key_features), len(axes)):
    fig.delaxes(axes[j])
plt.suptitle('Feature Distributions Across Target Classes', fontsize=16, fontweight='bold', y=1.02)
plt.tight_layout()
plt.show()

#  Grouped bar charts (categorical features vs target)
cat_cols = [c for c in temp.columns if c not in num_cols and c != 'happiness_category' and temp[c].dtype in ['object', 'category']]
if cat_cols:
    n_cat = min(len(cat_cols), 4)
    fig, axes = plt.subplots(2, 2, figsize=(48, 12))
    axes = axes.flatten()
    for i, col in enumerate(cat_cols[:n_cat]):
        ct = pd.crosstab(temp[col], temp['happiness_category'])
        ct = ct.reindex(columns=category, fill_value=0)
        ct.plot(kind='bar', ax=axes[i], colormap='RdYlGn', edgecolor='black')
        axes[i].set_title(f'{col} vs Happiness Category', fontsize=12, fontweight='bold')
        axes[i].set_xlabel(col)
        axes[i].set_ylabel('Count')
        axes[i].legend(title='Happiness', bbox_to_anchor=(1.02, 1), loc='upper left')
        axes[i].tick_params(axis='x', rotation=45)
    for j in range(n_cat, len(axes)):
        fig.delaxes(axes[j])
    plt.suptitle('Grouped Bar Charts: Categorical Features vs Target', fontsize=16, fontweight='bold', y=1.02)
    plt.tight_layout()
    plt.show()
else:
    print("No categorical features found for grouped bar charts.")

Correlation with target (happiness_category):
perceptions_of_corruption        0.189
population_below_poverty_line    0.160
hdi                              0.083
social_support                   0.078
gdp_per_capita                   0.059
generosity                       0.058
healthy_life_expectancy          0.043
freedom_to_make_life_choices    -0.046
population                      -0.180

/tmp/ipykernel_19057/2757820991.py:37: FutureWarning: 

Passing `palette` without assigning `hue` is deprecated and will be removed in v0.14.0. Assign the `x` variable to `hue` and set `legend=False` for the same effect.

  sns.boxplot(data=temp, x='happiness_category', y=col, order=category, palette='RdYlGn', ax=axes[i])
/tmp/ipykernel_19057/2757820991.py:37: FutureWarning: 

Passing `palette` without assigning `hue` is deprecated and will be removed in v0.14.0. Assign the `x` variable to `hue` and set `legend=False` for the same effect.

  sns.boxplot(data=temp, x='happiness_category', y=col, order=category, palette='RdYlGn', ax=axes[i])
/tmp/ipykernel_19057/2757820991.py:37: FutureWarning: 

Passing `palette` without assigning `hue` is deprecated and will be removed in v0.14.0. Assign the `x` variable to `hue` and set `legend=False` for the same effect.

  sns.boxplot(data=temp, x='happiness_category', y=col, order=category, palette='RdYlGn', ax=axes[i])
/tmp/ipykernel_19057/2757820991.py:37: FutureWarning: 

Passing `palette` without assigning `hue` is deprecated and will be removed in v0.14.0. Assign the `x` variable to `hue` and set `legend=False` for the same effect.

  sns.boxplot(data=temp, x='happiness_category', y=col, order=category, palette='RdYlGn', ax=axes[i])
/tmp/ipykernel_19057/2757820991.py:37: FutureWarning: 

Passing `palette` without assigning `hue` is deprecated and will be removed in v0.14.0. Assign the `x` variable to `hue` and set `legend=False` for the same effect.

  sns.boxplot(data=temp, x='happiness_category', y=col, order=category, palette='RdYlGn', ax=axes[i])
/tmp/ipykernel_19057/2757820991.py:37: FutureWarning: 

Passing `palette` without assigning `hue` is deprecated and will be removed in v0.14.0. Assign the `x` variable to `hue` and set `legend=False` for the same effect.

  sns.boxplot(data=temp, x='happiness_category', y=col, order=category, palette='RdYlGn', ax=axes[i])
/tmp/ipykernel_19057/2757820991.py:37: FutureWarning: 

Passing `palette` without assigning `hue` is deprecated and will be removed in v0.14.0. Assign the `x` variable to `hue` and set `legend=False` for the same effect.

  sns.boxplot(data=temp, x='happiness_category', y=col, order=category, palette='RdYlGn', ax=axes[i])
/tmp/ipykernel_19057/2757820991.py:37: FutureWarning: 

Passing `palette` without assigning `hue` is deprecated and will be removed in v0.14.0. Assign the `x` variable to `hue` and set `legend=False` for the same effect.

  sns.boxplot(data=temp, x='happiness_category', y=col, order=category, palette='RdYlGn', ax=axes[i])
/tmp/ipykernel_19057/2757820991.py:37: FutureWarning: 

Passing `palette` without assigning `hue` is deprecated and will be removed in v0.14.0. Assign the `x` variable to `hue` and set `legend=False` for the same effect.

  sns.boxplot(data=temp, x='happiness_category', y=col, order=category, palette='RdYlGn', ax=axes[i])

/tmp/ipykernel_19057/2757820991.py:51: FutureWarning: 

Passing `palette` without assigning `hue` is deprecated and will be removed in v0.14.0. Assign the `x` variable to `hue` and set `legend=False` for the same effect.

  sns.stripplot(data=temp, x='happiness_category', y=col, order=category, palette='RdYlGn', jitter=0.25, size=6, alpha=0.6, ax=axes[i], edgecolor='black', linewidth=0.5)
/tmp/ipykernel_19057/2757820991.py:51: FutureWarning: 

Passing `palette` without assigning `hue` is deprecated and will be removed in v0.14.0. Assign the `x` variable to `hue` and set `legend=False` for the same effect.

  sns.stripplot(data=temp, x='happiness_category', y=col, order=category, palette='RdYlGn', jitter=0.25, size=6, alpha=0.6, ax=axes[i], edgecolor='black', linewidth=0.5)
/tmp/ipykernel_19057/2757820991.py:51: FutureWarning: 

Passing `palette` without assigning `hue` is deprecated and will be removed in v0.14.0. Assign the `x` variable to `hue` and set `legend=False` for the same effect.

  sns.stripplot(data=temp, x='happiness_category', y=col, order=category, palette='RdYlGn', jitter=0.25, size=6, alpha=0.6, ax=axes[i], edgecolor='black', linewidth=0.5)
/tmp/ipykernel_19057/2757820991.py:51: FutureWarning: 

Passing `palette` without assigning `hue` is deprecated and will be removed in v0.14.0. Assign the `x` variable to `hue` and set `legend=False` for the same effect.

  sns.stripplot(data=temp, x='happiness_category', y=col, order=category, palette='RdYlGn', jitter=0.25, size=6, alpha=0.6, ax=axes[i], edgecolor='black', linewidth=0.5)
/tmp/ipykernel_19057/2757820991.py:51: FutureWarning: 

Passing `palette` without assigning `hue` is deprecated and will be removed in v0.14.0. Assign the `x` variable to `hue` and set `legend=False` for the same effect.

  sns.stripplot(data=temp, x='happiness_category', y=col, order=category, palette='RdYlGn', jitter=0.25, size=6, alpha=0.6, ax=axes[i], edgecolor='black', linewidth=0.5)
/tmp/ipykernel_19057/2757820991.py:51: FutureWarning: 

Passing `palette` without assigning `hue` is deprecated and will be removed in v0.14.0. Assign the `x` variable to `hue` and set `legend=False` for the same effect.

  sns.stripplot(data=temp, x='happiness_category', y=col, order=category, palette='RdYlGn', jitter=0.25, size=6, alpha=0.6, ax=axes[i], edgecolor='black', linewidth=0.5)
/tmp/ipykernel_19057/2757820991.py:51: FutureWarning: 

Passing `palette` without assigning `hue` is deprecated and will be removed in v0.14.0. Assign the `x` variable to `hue` and set `legend=False` for the same effect.

  sns.stripplot(data=temp, x='happiness_category', y=col, order=category, palette='RdYlGn', jitter=0.25, size=6, alpha=0.6, ax=axes[i], edgecolor='black', linewidth=0.5)
/tmp/ipykernel_19057/2757820991.py:51: FutureWarning: 

Passing `palette` without assigning `hue` is deprecated and will be removed in v0.14.0. Assign the `x` variable to `hue` and set `legend=False` for the same effect.

  sns.stripplot(data=temp, x='happiness_category', y=col, order=category, palette='RdYlGn', jitter=0.25, size=6, alpha=0.6, ax=axes[i], edgecolor='black', linewidth=0.5)
/tmp/ipykernel_19057/2757820991.py:51: FutureWarning: 

Passing `palette` without assigning `hue` is deprecated and will be removed in v0.14.0. Assign the `x` variable to `hue` and set `legend=False` for the same effect.

  sns.stripplot(data=temp, x='happiness_category', y=col, order=category, palette='RdYlGn', jitter=0.25, size=6, alpha=0.6, ax=axes[i], edgecolor='black', linewidth=0.5)

/usr/local/lib/python3.12/dist-packages/numpy/lib/_histograms_impl.py:895: RuntimeWarning: invalid value encountered in divide
  return n/db/n.sum(), bin_edges

# Your code here: TODO
import pandas as pd
from IPython.display import display
from scipy import stats
import numpy as np


numeric_cols = X_train.select_dtypes(include=['float64', 'int64']).columns
plt.figure(figsize=(18, 10))

X_train[numeric_cols].boxplot(rot=45)
plt.title('Outlier Identification: Global Boxplot View', fontsize=14, fontweight='bold')
plt.show()

# Interquartile Range (IQR) Method
def detect_outliers_iqr(df, features):
    """
    Calculates the outlier count and percentage for specified features using the IQR rule.
    """
    outlier_summary = {}

    for col in features:
        # Calculate the 25th and 75th percentiles
        Q1 = df[col].quantile(0.25)
        Q3 = df[col].quantile(0.75)

        # IQR represents the range where the middle 50% of the data sits
        IQR = Q3 - Q1

        # Calculate boundaries. 1.5 is the standard multiplier for identifying mild outliers.
        lower_bound = Q1 - 1.5 * IQR
        upper_bound = Q3 + 1.5 * IQR

        outliers = df[(df[col] < lower_bound) | (df[col] > upper_bound)]

        outlier_summary[col] = {
            'Count': len(outliers),
            'Percentage (%)': round((len(outliers) / len(df)) * 100, 2)
        }


    return pd.DataFrame(outlier_summary).T

# Detect outliers across all numeric features in X_train
outlier_results = detect_outliers_iqr(X_train, numeric_cols)


print("Outlier Detection Summary Table:")
display(outlier_results[outlier_results['Count'] > 0].sort_values(by='Count', ascending=False))


def detect_outliers_zscore(df, threshold=3):
    """
    Identifies outliers using the Z-score method.
    Standard threshold is 3 (99.7% of data in a normal distribution falls within 3 SD).
    """
    z_scores = np.abs(stats.zscore(df.select_dtypes(include=[np.number])))


    outlier_indices = np.where(z_scores > threshold)


    outlier_list = []
    for row, col in zip(outlier_indices[0], outlier_indices[1]):
        feature_name = df.columns[col]
        value = df.iloc[row, col]
        z_val = z_scores[row, col]
        outlier_list.append([row, feature_name, value, z_val])

    return pd.DataFrame(outlier_list, columns=['Row_Index', 'Feature', 'Value', 'Z-Score'])

z_outliers = detect_outliers_zscore(X_train)

print(f"Total Outliers detected (Z > 3): {len(z_outliers)}")
display(z_outliers.sort_values(by='Z-Score', ascending=False).head(10))

Outlier Detection Summary Table:

Total Outliers detected (Z > 3): 5

# Your code here: TODO
import pandas as pd
import numpy as np

num_cols = X_train.select_dtypes(include=['float64', 'int64']).columns.tolist()
skewed_features = [col for col in num_cols if X_train[col].skew() > 0] # review

for col in skewed_features:
    X_train[col] = np.log1p(X_train[col])
    X_test[col] = np.log1p(X_test[col])

if len(skewed_features) > 0:
    print(f"Skewed features after log transformation -train set: {', '.join(skewed_features)}")
    print(X_train[skewed_features].describe())

if len(skewed_features) > 0:
    print(f"Skewed features after log transformation - test set: {', '.join(skewed_features)}")
    print(X_test[skewed_features].describe())

Skewed features after log transformation -train set: generosity, perceptions_of_corruption, population, population_below_poverty_line, gni
       generosity  perceptions_of_corruption  population  \
count   95.000000                  95.000000   89.000000   
mean     0.143291                   0.130229   16.436721   
std      0.061651                   0.107665    1.613574   
min      0.007968                   0.000000   12.721963   
25%      0.100298                   0.057325   15.510697   
50%      0.131905                   0.098940   16.578716   
75%      0.187309                   0.158284   17.391769   
max      0.352064                   0.445327   21.066513   

       population_below_poverty_line        gni  
count                      79.000000  88.000000  
mean                        3.152901   9.203528  
std                         0.624395   1.224096  
min                         1.458615   6.527359  
25%                         2.772589   8.164017  
50%                         3.152736   9.384480  
75%                         3.593118  10.211987  
max                         4.294561  11.266556  
Skewed features after log transformation - test set: generosity, perceptions_of_corruption, population, population_below_poverty_line, gni
       generosity  perceptions_of_corruption  population  \
count   42.000000                  42.000000   39.000000   
mean     0.120502                   0.131557   16.538485   
std      0.070842                   0.094699    1.370300   
min      0.000000                   0.002996   14.521148   
25%      0.076960                   0.064148   15.391015   
50%      0.110643                   0.121313   16.260647   
75%      0.163361                   0.181693   17.571327   
max      0.336472                   0.388658   19.597671   

       population_below_poverty_line        gni  
count                      39.000000  39.000000  
mean                        3.046495   9.344038  
std                         0.611242   1.071450  
min                         1.308333   7.002552  
25%                         2.791090   8.524843  
50%                         3.135494   9.496464  
75%                         3.462429  10.029360  
max                         4.099332  11.100501

# Your code here: TODO
X_train['interaction_feature1'] = X_train['generosity'] * X_train['perceptions_of_corruption']
X_test['interaction_feature1'] = X_test['generosity'] * X_test['perceptions_of_corruption']


# Check X_train results
display(X_train[['generosity', 'perceptions_of_corruption', 'interaction_feature1']].head())

# Check X_test results
display(X_test[['generosity', 'perceptions_of_corruption', 'interaction_feature1']].head())

from sklearn.preprocessing import StandardScaler, OneHotEncoder
from sklearn.compose import ColumnTransformer, make_column_transformer
from sklearn.pipeline import Pipeline
from sklearn.impute import SimpleImputer

# Create the preprocessing pipelines for both numeric and categorical data.

# Dynamically identify numeric and categorical features
# Exclude 'country' as it's an identifier used for merging, not a feature to be encoded/scaled.
numeric_features = X_train.select_dtypes(include=['float64', 'int64']).columns.tolist()
categorical_features = X_train.select_dtypes(include=['object']).columns.tolist()

# Remove 'country' from categorical features if it's there, as it's typically dropped or handled differently
if 'country' in categorical_features:
    categorical_features.remove('country')

# Numeric transformer: impute missing numerical values with the mean, then scale
numeric_transformer = Pipeline(steps=[
    ('imputer', SimpleImputer(strategy='mean')),
    ('scaler', StandardScaler())])

# Categorical transformer: impute missing categorical values with the most frequent, then one-hot encode
categorical_transformer = Pipeline(steps=[
    ('imputer', SimpleImputer(strategy='most_frequent')),
    ('onehot', OneHotEncoder(handle_unknown='ignore'))])

# final preprocessor object set up with ColumnTransformer
preprocessor = ColumnTransformer(
    transformers=[
        ('num', numeric_transformer, numeric_features),
        ('cat', categorical_transformer, categorical_features)
    ],
    remainder='drop' # Changed from 'passthrough' to 'drop'
)

#Fit your preprocessor object
preprocess=preprocessor.fit(X_train)

# function to transform data with preprocessor
def preprocessor(data):
    preprocessed_data = preprocess.transform(data)
    return preprocessed_data

# check shape of X data after preprocessing it using our new function
preprocessor(X_train).shape

(95, 24)

from sklearn.ensemble import RandomForestClassifier

X_train_proc = preprocess.transform(X_train)
X_test_proc  = preprocess.transform(X_test)

if hasattr(X_train_proc, "toarray"):
    X_train_proc = X_train_proc.toarray()
    X_test_proc  = X_test_proc.toarray()

model = RandomForestClassifier(
    n_estimators=300,
    random_state=42,
    n_jobs=-1)

model.fit(X_train_proc, y_train)

# Score (accuracy in [0,1])
test_score = model.score(X_test_proc, y_test)
test_score

0.5714285714285714

import os
import pickle

os.makedirs("artifacts", exist_ok=True)

with open("artifacts/preprocess.pkl", "wb") as f:
    pickle.dump(preprocess, f)

with open("artifacts/random_forest_model.pkl", "wb") as f:
    pickle.dump(model, f)

print("Saved:")
print(" - artifacts/preprocess.pkl")
print(" - artifacts/random_forest_model.pkl")

Saved:
 - artifacts/preprocess.pkl
 - artifacts/random_forest_model.pkl

from sklearn.metrics import accuracy_score, confusion_matrix, classification_report

# -- Generate predicted values (Model 1)
prediction_labels = model.predict(preprocessor(X_test))

# -- Evaluate model performance
accuracy = accuracy_score(y_test, prediction_labels)
print("Accuracy:", accuracy)

print("\nConfusion Matrix:")
print(confusion_matrix(y_test, prediction_labels))

print("\nClassification Report:")
print(classification_report(y_test, prediction_labels))

# Write lines of code to show model performance by comparing prediction_labels with true labels: TODO

Accuracy: 0.5714285714285714

Confusion Matrix:
[[5 1 2 0 0]
 [2 5 0 1 0]
 [0 0 5 0 3]
 [1 2 0 6 0]
 [0 0 6 0 3]]

Classification Report:
              precision    recall  f1-score   support

     Average       0.62      0.62      0.62         8
        High       0.62      0.62      0.62         8
         Low       0.38      0.62      0.48         8
   Very High       0.86      0.67      0.75         9
    Very Low       0.50      0.33      0.40         9

    accuracy                           0.57        42
   macro avg       0.60      0.57      0.58        42
weighted avg       0.60      0.57      0.58        42

from sklearn.ensemble import RandomForestClassifier
from sklearn.metrics import accuracy_score, confusion_matrix, classification_report

# Train model 2 using same preprocessor
model_2 = RandomForestClassifier(
    n_estimators=500,
    max_depth=8,
    min_samples_split=4,
    min_samples_leaf=2,
    random_state=42,
    n_jobs=-1)

model_2.fit(X_train_proc, y_train)

RandomForestClassifier(max_depth=8, min_samples_leaf=2, min_samples_split=4,
                       n_estimators=500, n_jobs=-1, random_state=42)

RandomForestClassifier(max_depth=8, min_samples_leaf=2, min_samples_split=4,
                       n_estimators=500, n_jobs=-1, random_state=42)

# -- Generate predicted y values (Model 2)
prediction_labels_2 = model_2.predict(X_test_proc)

# -- Show model 2 performance
accuracy_2 = accuracy_score(y_test, prediction_labels_2)
print("Model 2 Accuracy:", accuracy_2)

print("\nModel 2 Confusion Matrix:")
print(confusion_matrix(y_test, prediction_labels_2))

print("\nModel 2 Classification Report:")
print(classification_report(y_test, prediction_labels_2))

Model 2 Accuracy: 0.5952380952380952

Model 2 Confusion Matrix:
[[6 1 1 0 0]
 [2 5 0 1 0]
 [1 0 4 0 3]
 [1 2 0 6 0]
 [0 0 5 0 4]]

Model 2 Classification Report:
              precision    recall  f1-score   support

     Average       0.60      0.75      0.67         8
        High       0.62      0.62      0.62         8
         Low       0.40      0.50      0.44         8
   Very High       0.86      0.67      0.75         9
    Very Low       0.57      0.44      0.50         9

    accuracy                           0.60        42
   macro avg       0.61      0.60      0.60        42
weighted avg       0.62      0.60      0.60        42

print("Model 1 Accuracy:", accuracy)
print("Model 2 Accuracy:", accuracy_2)

Model 1 Accuracy: 0.5714285714285714
Model 2 Accuracy: 0.5952380952380952

from sklearn.ensemble import RandomForestClassifier
from sklearn.model_selection import GridSearchCV
import numpy as np

# Parameter grid
param_grid = {
    'n_estimators': np.arange(200, 601, 100),
    'max_depth': [6, 8, 10, None],
    'min_samples_split': np.arange(2, 7, 2),
    'min_samples_leaf': np.arange(1, 4, 1)
}

# Base model
rf = RandomForestClassifier(random_state=42, n_jobs=-1)

# GridSearchCV object
gridmodel = GridSearchCV(
    estimator=rf,
    param_grid=param_grid,
    cv=5,
    scoring='accuracy',
    n_jobs=-1)

# Fit on preprocessed training data
gridmodel.fit(X_train_proc, y_train)

# Best result
print("best mean cross-validation score: {:.3f}".format(gridmodel.best_score_))
print("best parameters: {}".format(gridmodel.best_params_))

best mean cross-validation score: 0.568
best parameters: {'max_depth': 6, 'min_samples_leaf': np.int64(1), 'min_samples_split': np.int64(4), 'n_estimators': np.int64(300)}

from sklearn.metrics import accuracy_score, confusion_matrix, classification_report

# Make predictions using best model
prediction_labels_3 = gridmodel.best_estimator_.predict(X_test_proc)

# Evaluate Model 3
accuracy_3 = accuracy_score(y_test, prediction_labels_3)
print("Model 3 Accuracy:", accuracy_3)

print("\nModel 3 Confusion Matrix:")
print(confusion_matrix(y_test, prediction_labels_3))

print("\nModel 3 Classification Report:")
print(classification_report(y_test, prediction_labels_3))

Model 3 Accuracy: 0.6190476190476191

Model 3 Confusion Matrix:
[[6 1 1 0 0]
 [2 5 0 1 0]
 [0 0 5 0 3]
 [1 2 0 6 0]
 [0 0 5 0 4]]

Model 3 Classification Report:
              precision    recall  f1-score   support

     Average       0.67      0.75      0.71         8
        High       0.62      0.62      0.62         8
         Low       0.45      0.62      0.53         8
   Very High       0.86      0.67      0.75         9
    Very Low       0.57      0.44      0.50         9

    accuracy                           0.62        42
   macro avg       0.63      0.62      0.62        42
weighted avg       0.64      0.62      0.62        42

print("Model 1 Accuracy:", accuracy)
print("Model 2 Accuracy:", accuracy_2)
print("Model 3 Accuracy:", accuracy_3)

Model 1 Accuracy: 0.5714285714285714
Model 2 Accuracy: 0.5952380952380952
Model 3 Accuracy: 0.6190476190476191

from sklearn.ensemble import GradientBoostingClassifier
from sklearn.metrics import accuracy_score, confusion_matrix, classification_report

model_4 = GradientBoostingClassifier(
    n_estimators=300,
    learning_rate=0.01,
    max_depth=3,
    random_state=42)

model_4.fit(X_train_proc, y_train)

prediction_labels_4 = model_4.predict(X_test_proc)

accuracy_4 = accuracy_score(y_test, prediction_labels_4)
print("Model 4 Accuracy:", accuracy_4)

print("\nModel 4 Confusion Matrix:")
print(confusion_matrix(y_test, prediction_labels_4))

print("\nModel 4 Classification Report:")
print(classification_report(y_test, prediction_labels_4))

Model 4 Accuracy: 0.5

Model 4 Confusion Matrix:
[[3 4 1 0 0]
 [2 4 0 2 0]
 [1 0 4 0 3]
 [0 3 0 6 0]
 [1 0 4 0 4]]

Model 4 Classification Report:
              precision    recall  f1-score   support

     Average       0.43      0.38      0.40         8
        High       0.36      0.50      0.42         8
         Low       0.44      0.50      0.47         8
   Very High       0.75      0.67      0.71         9
    Very Low       0.57      0.44      0.50         9

    accuracy                           0.50        42
   macro avg       0.51      0.50      0.50        42
weighted avg       0.52      0.50      0.50        42

# Now experiment with deep learning models:
import keras
from keras.models import Sequential
from keras.layers import Dense, Dropout, BatchNormalization
from keras.utils import to_categorical
import numpy as np

# Preprocess input features
X_train_nn = preprocess.transform(X_train)
X_test_nn  = preprocess.transform(X_test)

if hasattr(X_train_nn, "toarray"):
    X_train_nn = X_train_nn.toarray()
    X_test_nn  = X_test_nn.toarray()

# Count features in input data
feature_count = X_train_nn.shape[1]
print(f"Feature count: {feature_count}")

# Encode categorical labels as one-hot vectors
# y_train categories: Very Low=0, Low=1, Average=2, High=3, Very High=4
category_order = ["Very Low", "Low", "Average", "High", "Very High"]
y_train_cat = pd.Categorical(y_train, categories=category_order, ordered=True)
y_test_cat  = pd.Categorical(y_test,  categories=category_order, ordered=True)

y_train_ohe = to_categorical(y_train_cat.codes, num_classes=5)
y_test_ohe  = to_categorical(y_test_cat.codes,  num_classes=5)

num_classes = 5  # Very Low, Low, Average, High, Very High

# Define Neural Network: 5 layers 128->64->64->32->5
keras_model = Sequential([
    Dense(128, input_dim=feature_count, activation="relu"),
    Dense(64,  activation="relu"),
    Dense(64,  activation="relu"),
    Dense(32,  activation="relu"),
    Dense(num_classes, activation="softmax")  # 5 output neurons, one per class
])

keras_model.summary()

# Compile model
keras_model.compile(loss="categorical_crossentropy", optimizer="sgd", metrics=["accuracy"])

# Fit model — pass one-hot encoded y
history = keras_model.fit(
    X_train_nn, y_train_ohe,
    batch_size=20,
    epochs=300,
    validation_split=0.25,
    verbose=1
)

Feature count: 24

/usr/local/lib/python3.12/dist-packages/keras/src/layers/core/dense.py:93: UserWarning: Do not pass an `input_shape`/`input_dim` argument to a layer. When using Sequential models, prefer using an `Input(shape)` object as the first layer in the model instead.
  super().__init__(activity_regularizer=activity_regularizer, **kwargs)

Model: "sequential"

┏━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━┓
┃ Layer (type)                    ┃ Output Shape           ┃       Param # ┃
┡━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━┩
│ dense (Dense)                   │ (None, 128)            │         3,200 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ dense_1 (Dense)                 │ (None, 64)             │         8,256 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ dense_2 (Dense)                 │ (None, 64)             │         4,160 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ dense_3 (Dense)                 │ (None, 32)             │         2,080 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ dense_4 (Dense)                 │ (None, 5)              │           165 │
└─────────────────────────────────┴────────────────────────┴───────────────┘

 Total params: 17,861 (69.77 KB)

 Trainable params: 17,861 (69.77 KB)

 Non-trainable params: 0 (0.00 B)

Epoch 1/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 1s 111ms/step - accuracy: 0.1749 - loss: 1.5958 - val_accuracy: 0.1250 - val_loss: 1.5997
Epoch 2/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 25ms/step - accuracy: 0.1616 - loss: 1.5905 - val_accuracy: 0.2083 - val_loss: 1.5947
Epoch 3/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 25ms/step - accuracy: 0.2706 - loss: 1.5742 - val_accuracy: 0.2083 - val_loss: 1.5899
Epoch 4/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.3644 - loss: 1.5579 - val_accuracy: 0.1667 - val_loss: 1.5850
Epoch 5/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 25ms/step - accuracy: 0.4640 - loss: 1.5390 - val_accuracy: 0.1667 - val_loss: 1.5796
Epoch 6/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 25ms/step - accuracy: 0.4953 - loss: 1.5293 - val_accuracy: 0.1667 - val_loss: 1.5747
Epoch 7/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.5562 - loss: 1.5114 - val_accuracy: 0.2083 - val_loss: 1.5699
Epoch 8/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 31ms/step - accuracy: 0.5105 - loss: 1.5076 - val_accuracy: 0.2500 - val_loss: 1.5647
Epoch 9/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.4622 - loss: 1.5028 - val_accuracy: 0.2500 - val_loss: 1.5596
Epoch 10/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.5424 - loss: 1.4783 - val_accuracy: 0.2500 - val_loss: 1.5535
Epoch 11/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.5972 - loss: 1.4521 - val_accuracy: 0.2917 - val_loss: 1.5475
Epoch 12/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.4572 - loss: 1.4613 - val_accuracy: 0.2917 - val_loss: 1.5422
Epoch 13/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 25ms/step - accuracy: 0.5358 - loss: 1.4353 - val_accuracy: 0.2917 - val_loss: 1.5367
Epoch 14/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.4985 - loss: 1.4349 - val_accuracy: 0.2917 - val_loss: 1.5308
Epoch 15/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.4901 - loss: 1.4187 - val_accuracy: 0.2917 - val_loss: 1.5249
Epoch 16/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.4728 - loss: 1.4142 - val_accuracy: 0.2917 - val_loss: 1.5186
Epoch 17/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 29ms/step - accuracy: 0.4388 - loss: 1.4007 - val_accuracy: 0.2917 - val_loss: 1.5127
Epoch 18/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.5172 - loss: 1.3574 - val_accuracy: 0.2917 - val_loss: 1.5066
Epoch 19/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 25ms/step - accuracy: 0.5255 - loss: 1.3569 - val_accuracy: 0.2917 - val_loss: 1.5008
Epoch 20/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.5212 - loss: 1.3307 - val_accuracy: 0.2917 - val_loss: 1.4954
Epoch 21/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.5288 - loss: 1.3080 - val_accuracy: 0.2917 - val_loss: 1.4902
Epoch 22/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.4822 - loss: 1.3206 - val_accuracy: 0.2917 - val_loss: 1.4839
Epoch 23/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.5005 - loss: 1.3221 - val_accuracy: 0.2917 - val_loss: 1.4779
Epoch 24/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 29ms/step - accuracy: 0.4838 - loss: 1.2906 - val_accuracy: 0.2917 - val_loss: 1.4725
Epoch 25/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 28ms/step - accuracy: 0.4795 - loss: 1.2894 - val_accuracy: 0.2917 - val_loss: 1.4670
Epoch 26/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 31ms/step - accuracy: 0.5112 - loss: 1.2525 - val_accuracy: 0.2917 - val_loss: 1.4612
Epoch 27/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.4778 - loss: 1.2609 - val_accuracy: 0.2917 - val_loss: 1.4558
Epoch 28/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.5278 - loss: 1.2337 - val_accuracy: 0.2917 - val_loss: 1.4507
Epoch 29/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.5505 - loss: 1.2270 - val_accuracy: 0.2917 - val_loss: 1.4450
Epoch 30/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 25ms/step - accuracy: 0.4655 - loss: 1.2476 - val_accuracy: 0.2917 - val_loss: 1.4407
Epoch 31/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 25ms/step - accuracy: 0.5155 - loss: 1.2115 - val_accuracy: 0.2917 - val_loss: 1.4373
Epoch 32/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 46ms/step - accuracy: 0.4845 - loss: 1.2270 - val_accuracy: 0.2917 - val_loss: 1.4329
Epoch 33/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 49ms/step - accuracy: 0.5362 - loss: 1.1746 - val_accuracy: 0.2917 - val_loss: 1.4279
Epoch 34/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 48ms/step - accuracy: 0.5638 - loss: 1.1439 - val_accuracy: 0.2917 - val_loss: 1.4243
Epoch 35/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 48ms/step - accuracy: 0.5055 - loss: 1.1647 - val_accuracy: 0.2917 - val_loss: 1.4205
Epoch 36/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 38ms/step - accuracy: 0.4718 - loss: 1.1835 - val_accuracy: 0.2917 - val_loss: 1.4174
Epoch 37/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 36ms/step - accuracy: 0.5105 - loss: 1.1249 - val_accuracy: 0.2917 - val_loss: 1.4149
Epoch 38/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 38ms/step - accuracy: 0.5135 - loss: 1.1198 - val_accuracy: 0.3333 - val_loss: 1.4128
Epoch 39/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 54ms/step - accuracy: 0.5178 - loss: 1.1211 - val_accuracy: 0.2917 - val_loss: 1.4087
Epoch 40/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 52ms/step - accuracy: 0.4845 - loss: 1.1232 - val_accuracy: 0.2917 - val_loss: 1.4061
Epoch 41/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 47ms/step - accuracy: 0.4968 - loss: 1.0970 - val_accuracy: 0.2917 - val_loss: 1.4038
Epoch 42/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 42ms/step - accuracy: 0.4751 - loss: 1.1131 - val_accuracy: 0.2917 - val_loss: 1.4016
Epoch 43/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 36ms/step - accuracy: 0.5035 - loss: 1.0739 - val_accuracy: 0.2917 - val_loss: 1.3973
Epoch 44/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 48ms/step - accuracy: 0.5418 - loss: 1.0571 - val_accuracy: 0.2917 - val_loss: 1.3945
Epoch 45/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 37ms/step - accuracy: 0.5085 - loss: 1.0521 - val_accuracy: 0.2917 - val_loss: 1.3919
Epoch 46/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 35ms/step - accuracy: 0.5401 - loss: 1.0652 - val_accuracy: 0.2917 - val_loss: 1.3898
Epoch 47/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 37ms/step - accuracy: 0.4885 - loss: 1.0797 - val_accuracy: 0.2917 - val_loss: 1.3880
Epoch 48/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 41ms/step - accuracy: 0.5151 - loss: 1.0533 - val_accuracy: 0.3333 - val_loss: 1.3856
Epoch 49/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 46ms/step - accuracy: 0.5418 - loss: 0.9920 - val_accuracy: 0.3333 - val_loss: 1.3844
Epoch 50/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 40ms/step - accuracy: 0.4851 - loss: 1.0495 - val_accuracy: 0.3333 - val_loss: 1.3821
Epoch 51/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 48ms/step - accuracy: 0.5485 - loss: 1.0080 - val_accuracy: 0.3333 - val_loss: 1.3792
Epoch 52/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 34ms/step - accuracy: 0.5191 - loss: 1.0036 - val_accuracy: 0.3333 - val_loss: 1.3769
Epoch 53/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.5068 - loss: 1.0156 - val_accuracy: 0.3333 - val_loss: 1.3758
Epoch 54/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.5624 - loss: 0.9695 - val_accuracy: 0.3333 - val_loss: 1.3744
Epoch 55/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.5647 - loss: 0.9912 - val_accuracy: 0.3333 - val_loss: 1.3724
Epoch 56/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.6154 - loss: 0.9421 - val_accuracy: 0.3333 - val_loss: 1.3707
Epoch 57/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 42ms/step - accuracy: 0.5816 - loss: 0.9877 - val_accuracy: 0.3333 - val_loss: 1.3676
Epoch 58/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.5466 - loss: 1.0384 - val_accuracy: 0.3333 - val_loss: 1.3669
Epoch 59/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 25ms/step - accuracy: 0.5570 - loss: 0.9650 - val_accuracy: 0.3333 - val_loss: 1.3652
Epoch 60/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.5354 - loss: 0.9951 - val_accuracy: 0.3333 - val_loss: 1.3648
Epoch 61/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 28ms/step - accuracy: 0.5593 - loss: 0.9444 - val_accuracy: 0.3333 - val_loss: 1.3634
Epoch 62/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.5120 - loss: 0.9837 - val_accuracy: 0.3333 - val_loss: 1.3635
Epoch 63/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.5777 - loss: 0.9636 - val_accuracy: 0.3750 - val_loss: 1.3611
Epoch 64/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.5404 - loss: 0.9594 - val_accuracy: 0.3750 - val_loss: 1.3594
Epoch 65/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 28ms/step - accuracy: 0.5220 - loss: 1.0003 - val_accuracy: 0.3750 - val_loss: 1.3575
Epoch 66/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.5927 - loss: 0.9460 - val_accuracy: 0.3750 - val_loss: 1.3548
Epoch 67/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.5570 - loss: 0.9214 - val_accuracy: 0.3750 - val_loss: 1.3558
Epoch 68/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.5504 - loss: 0.9431 - val_accuracy: 0.3750 - val_loss: 1.3527
Epoch 69/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.5877 - loss: 0.9301 - val_accuracy: 0.4167 - val_loss: 1.3524
Epoch 70/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.5627 - loss: 0.9150 - val_accuracy: 0.4167 - val_loss: 1.3517
Epoch 71/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 25ms/step - accuracy: 0.6066 - loss: 0.8927 - val_accuracy: 0.4167 - val_loss: 1.3492
Epoch 72/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.6243 - loss: 0.8687 - val_accuracy: 0.3750 - val_loss: 1.3481
Epoch 73/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 25ms/step - accuracy: 0.6329 - loss: 0.8909 - val_accuracy: 0.3750 - val_loss: 1.3480
Epoch 74/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 25ms/step - accuracy: 0.6225 - loss: 0.9501 - val_accuracy: 0.3750 - val_loss: 1.3460
Epoch 75/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.6083 - loss: 0.9205 - val_accuracy: 0.3333 - val_loss: 1.3482
Epoch 76/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.6798 - loss: 0.9059 - val_accuracy: 0.3333 - val_loss: 1.3465
Epoch 77/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.6129 - loss: 0.8845 - val_accuracy: 0.3333 - val_loss: 1.3442
Epoch 78/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.7152 - loss: 0.8332 - val_accuracy: 0.3750 - val_loss: 1.3418
Epoch 79/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 25ms/step - accuracy: 0.6908 - loss: 0.8363 - val_accuracy: 0.3333 - val_loss: 1.3408
Epoch 80/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 25ms/step - accuracy: 0.6771 - loss: 0.8390 - val_accuracy: 0.3333 - val_loss: 1.3378
Epoch 81/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.5583 - loss: 0.8713 - val_accuracy: 0.3333 - val_loss: 1.3364
Epoch 82/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.5796 - loss: 0.9108 - val_accuracy: 0.3750 - val_loss: 1.3345
Epoch 83/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 28ms/step - accuracy: 0.6056 - loss: 0.8929 - val_accuracy: 0.3333 - val_loss: 1.3346
Epoch 84/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.6129 - loss: 0.8832 - val_accuracy: 0.2917 - val_loss: 1.3330
Epoch 85/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.6696 - loss: 0.8298 - val_accuracy: 0.3750 - val_loss: 1.3340
Epoch 86/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 25ms/step - accuracy: 0.6339 - loss: 0.8502 - val_accuracy: 0.4167 - val_loss: 1.3369
Epoch 87/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 28ms/step - accuracy: 0.6815 - loss: 0.8475 - val_accuracy: 0.4167 - val_loss: 1.3340
Epoch 88/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 25ms/step - accuracy: 0.6465 - loss: 0.8624 - val_accuracy: 0.4167 - val_loss: 1.3361
Epoch 89/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 25ms/step - accuracy: 0.6704 - loss: 0.8436 - val_accuracy: 0.3750 - val_loss: 1.3261
Epoch 90/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.6575 - loss: 0.8619 - val_accuracy: 0.3333 - val_loss: 1.3241
Epoch 91/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.6825 - loss: 0.8308 - val_accuracy: 0.3333 - val_loss: 1.3224
Epoch 92/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.6848 - loss: 0.8319 - val_accuracy: 0.3750 - val_loss: 1.3207
Epoch 93/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.6579 - loss: 0.7797 - val_accuracy: 0.3333 - val_loss: 1.3203
Epoch 94/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.6681 - loss: 0.8337 - val_accuracy: 0.3333 - val_loss: 1.3179
Epoch 95/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 28ms/step - accuracy: 0.6931 - loss: 0.8118 - val_accuracy: 0.3333 - val_loss: 1.3150
Epoch 96/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.6898 - loss: 0.8268 - val_accuracy: 0.3750 - val_loss: 1.3152
Epoch 97/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.6648 - loss: 0.8055 - val_accuracy: 0.4583 - val_loss: 1.3058
Epoch 98/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.6216 - loss: 0.8231 - val_accuracy: 0.4167 - val_loss: 1.3073
Epoch 99/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.6669 - loss: 0.7972 - val_accuracy: 0.3750 - val_loss: 1.3059
Epoch 100/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 28ms/step - accuracy: 0.6515 - loss: 0.8136 - val_accuracy: 0.4167 - val_loss: 1.3036
Epoch 101/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.6358 - loss: 0.8153 - val_accuracy: 0.3750 - val_loss: 1.3028
Epoch 102/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 28ms/step - accuracy: 0.6571 - loss: 0.8296 - val_accuracy: 0.4167 - val_loss: 1.3009
Epoch 103/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.6319 - loss: 0.7917 - val_accuracy: 0.3750 - val_loss: 1.3020
Epoch 104/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 28ms/step - accuracy: 0.6785 - loss: 0.7649 - val_accuracy: 0.4167 - val_loss: 1.3056
Epoch 105/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.6477 - loss: 0.8297 - val_accuracy: 0.3750 - val_loss: 1.3039
Epoch 106/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.6248 - loss: 0.8191 - val_accuracy: 0.3750 - val_loss: 1.3018
Epoch 107/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.6204 - loss: 0.8175 - val_accuracy: 0.3750 - val_loss: 1.2994
Epoch 108/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.6865 - loss: 0.7714 - val_accuracy: 0.3750 - val_loss: 1.3019
Epoch 109/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 28ms/step - accuracy: 0.6681 - loss: 0.7506 - val_accuracy: 0.3750 - val_loss: 1.2993
Epoch 110/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.6525 - loss: 0.7519 - val_accuracy: 0.4167 - val_loss: 1.2984
Epoch 111/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.6781 - loss: 0.7217 - val_accuracy: 0.4167 - val_loss: 1.2959
Epoch 112/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.6648 - loss: 0.7860 - val_accuracy: 0.3750 - val_loss: 1.2945
Epoch 113/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 28ms/step - accuracy: 0.6898 - loss: 0.7118 - val_accuracy: 0.4167 - val_loss: 1.2961
Epoch 114/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.6431 - loss: 0.7594 - val_accuracy: 0.3750 - val_loss: 1.2899
Epoch 115/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 28ms/step - accuracy: 0.6065 - loss: 0.7889 - val_accuracy: 0.3750 - val_loss: 1.2898
Epoch 116/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.6325 - loss: 0.7566 - val_accuracy: 0.4167 - val_loss: 1.2878
Epoch 117/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.6938 - loss: 0.7374 - val_accuracy: 0.4167 - val_loss: 1.2886
Epoch 118/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 28ms/step - accuracy: 0.6654 - loss: 0.7213 - val_accuracy: 0.4167 - val_loss: 1.2876
Epoch 119/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 31ms/step - accuracy: 0.6454 - loss: 0.7710 - val_accuracy: 0.4167 - val_loss: 1.2901
Epoch 120/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.6821 - loss: 0.7105 - val_accuracy: 0.4167 - val_loss: 1.2884
Epoch 121/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 31ms/step - accuracy: 0.6698 - loss: 0.7266 - val_accuracy: 0.4167 - val_loss: 1.2886
Epoch 122/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 28ms/step - accuracy: 0.6515 - loss: 0.7473 - val_accuracy: 0.4167 - val_loss: 1.2883
Epoch 123/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.6515 - loss: 0.7446 - val_accuracy: 0.3750 - val_loss: 1.2856
Epoch 124/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.6175 - loss: 0.7168 - val_accuracy: 0.4583 - val_loss: 1.2867
Epoch 125/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.6231 - loss: 0.7681 - val_accuracy: 0.4167 - val_loss: 1.2839
Epoch 126/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.6219 - loss: 0.7529 - val_accuracy: 0.4583 - val_loss: 1.2982
Epoch 127/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.6777 - loss: 0.7752 - val_accuracy: 0.4167 - val_loss: 1.2876
Epoch 128/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 31ms/step - accuracy: 0.6204 - loss: 0.7573 - val_accuracy: 0.4167 - val_loss: 1.2869
Epoch 129/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.7388 - loss: 0.6735 - val_accuracy: 0.4167 - val_loss: 1.2818
Epoch 130/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.7240 - loss: 0.6875 - val_accuracy: 0.4583 - val_loss: 1.2770
Epoch 131/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.6581 - loss: 0.6921 - val_accuracy: 0.4167 - val_loss: 1.2795
Epoch 132/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.6944 - loss: 0.6716 - val_accuracy: 0.4167 - val_loss: 1.2818
Epoch 133/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.6427 - loss: 0.7374 - val_accuracy: 0.4167 - val_loss: 1.2787
Epoch 134/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 25ms/step - accuracy: 0.6977 - loss: 0.7304 - val_accuracy: 0.4167 - val_loss: 1.2802
Epoch 135/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.7384 - loss: 0.6484 - val_accuracy: 0.3750 - val_loss: 1.2777
Epoch 136/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 25ms/step - accuracy: 0.7096 - loss: 0.7498 - val_accuracy: 0.4167 - val_loss: 1.2836
Epoch 137/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 32ms/step - accuracy: 0.7353 - loss: 0.7140 - val_accuracy: 0.4583 - val_loss: 1.2880
Epoch 138/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 52ms/step - accuracy: 0.7759 - loss: 0.6700 - val_accuracy: 0.4583 - val_loss: 1.2803
Epoch 139/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 47ms/step - accuracy: 0.7853 - loss: 0.6522 - val_accuracy: 0.4167 - val_loss: 1.2812
Epoch 140/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 38ms/step - accuracy: 0.7619 - loss: 0.6832 - val_accuracy: 0.4167 - val_loss: 1.2844
Epoch 141/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 44ms/step - accuracy: 0.7499 - loss: 0.6907 - val_accuracy: 0.3750 - val_loss: 1.2794
Epoch 142/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 47ms/step - accuracy: 0.7426 - loss: 0.6961 - val_accuracy: 0.4167 - val_loss: 1.2783
Epoch 143/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 56ms/step - accuracy: 0.7630 - loss: 0.6865 - val_accuracy: 0.4583 - val_loss: 1.3003
Epoch 144/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 35ms/step - accuracy: 0.7822 - loss: 0.6712 - val_accuracy: 0.4167 - val_loss: 1.2883
Epoch 145/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 45ms/step - accuracy: 0.7845 - loss: 0.6814 - val_accuracy: 0.4167 - val_loss: 1.2876
Epoch 146/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 47ms/step - accuracy: 0.7649 - loss: 0.6717 - val_accuracy: 0.4167 - val_loss: 1.2863
Epoch 147/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 40ms/step - accuracy: 0.8038 - loss: 0.6365 - val_accuracy: 0.4167 - val_loss: 1.2827
Epoch 148/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 38ms/step - accuracy: 0.8230 - loss: 0.6578 - val_accuracy: 0.4167 - val_loss: 1.2770
Epoch 149/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 49ms/step - accuracy: 0.8251 - loss: 0.6472 - val_accuracy: 0.3750 - val_loss: 1.2803
Epoch 150/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 48ms/step - accuracy: 0.8218 - loss: 0.6343 - val_accuracy: 0.4583 - val_loss: 1.2799
Epoch 151/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 38ms/step - accuracy: 0.8007 - loss: 0.6470 - val_accuracy: 0.4583 - val_loss: 1.2772
Epoch 152/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 49ms/step - accuracy: 0.8251 - loss: 0.6402 - val_accuracy: 0.5000 - val_loss: 1.2781
Epoch 153/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 46ms/step - accuracy: 0.8280 - loss: 0.6423 - val_accuracy: 0.5000 - val_loss: 1.2738
Epoch 154/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 42ms/step - accuracy: 0.8268 - loss: 0.6072 - val_accuracy: 0.4583 - val_loss: 1.2742
Epoch 155/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 34ms/step - accuracy: 0.8380 - loss: 0.6246 - val_accuracy: 0.5417 - val_loss: 1.2712
Epoch 156/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 35ms/step - accuracy: 0.8032 - loss: 0.6301 - val_accuracy: 0.4583 - val_loss: 1.2754
Epoch 157/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 50ms/step - accuracy: 0.7984 - loss: 0.6565 - val_accuracy: 0.4583 - val_loss: 1.2792
Epoch 158/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 41ms/step - accuracy: 0.8261 - loss: 0.6127 - val_accuracy: 0.5000 - val_loss: 1.2758
Epoch 159/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 47ms/step - accuracy: 0.8624 - loss: 0.6041 - val_accuracy: 0.5000 - val_loss: 1.2801
Epoch 160/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 46ms/step - accuracy: 0.8847 - loss: 0.6031 - val_accuracy: 0.4583 - val_loss: 1.2778
Epoch 161/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 39ms/step - accuracy: 0.8618 - loss: 0.5725 - val_accuracy: 0.5417 - val_loss: 1.2813
Epoch 162/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.8491 - loss: 0.6187 - val_accuracy: 0.5417 - val_loss: 1.2832
Epoch 163/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.7897 - loss: 0.6523 - val_accuracy: 0.5000 - val_loss: 1.2802
Epoch 164/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.7828 - loss: 0.5943 - val_accuracy: 0.5417 - val_loss: 1.2843
Epoch 165/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 25ms/step - accuracy: 0.8580 - loss: 0.5891 - val_accuracy: 0.5417 - val_loss: 1.2856
Epoch 166/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.8747 - loss: 0.5656 - val_accuracy: 0.5000 - val_loss: 1.2818
Epoch 167/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 28ms/step - accuracy: 0.8641 - loss: 0.5841 - val_accuracy: 0.5417 - val_loss: 1.2936
Epoch 168/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.8341 - loss: 0.5856 - val_accuracy: 0.5417 - val_loss: 1.2937
Epoch 169/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 30ms/step - accuracy: 0.8664 - loss: 0.5768 - val_accuracy: 0.5000 - val_loss: 1.2878
Epoch 170/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.8614 - loss: 0.5481 - val_accuracy: 0.5417 - val_loss: 1.2950
Epoch 171/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 28ms/step - accuracy: 0.8474 - loss: 0.5661 - val_accuracy: 0.5417 - val_loss: 1.2960
Epoch 172/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.7974 - loss: 0.5993 - val_accuracy: 0.5417 - val_loss: 1.3017
Epoch 173/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 25ms/step - accuracy: 0.8253 - loss: 0.5682 - val_accuracy: 0.5417 - val_loss: 1.3057
Epoch 174/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.8614 - loss: 0.5635 - val_accuracy: 0.5000 - val_loss: 1.2923
Epoch 175/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 28ms/step - accuracy: 0.7645 - loss: 0.5836 - val_accuracy: 0.5417 - val_loss: 1.3066
Epoch 176/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.8280 - loss: 0.5755 - val_accuracy: 0.5417 - val_loss: 1.3024
Epoch 177/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 28ms/step - accuracy: 0.8397 - loss: 0.5599 - val_accuracy: 0.5417 - val_loss: 1.3088
Epoch 178/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 28ms/step - accuracy: 0.8876 - loss: 0.5529 - val_accuracy: 0.5000 - val_loss: 1.3041
Epoch 179/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 25ms/step - accuracy: 0.8426 - loss: 0.5837 - val_accuracy: 0.5417 - val_loss: 1.3028
Epoch 180/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 25ms/step - accuracy: 0.8234 - loss: 0.5508 - val_accuracy: 0.5417 - val_loss: 1.3158
Epoch 181/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.8920 - loss: 0.5151 - val_accuracy: 0.5000 - val_loss: 1.3082
Epoch 182/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.8570 - loss: 0.5993 - val_accuracy: 0.5417 - val_loss: 1.3230
Epoch 183/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.8543 - loss: 0.5725 - val_accuracy: 0.5417 - val_loss: 1.3279
Epoch 184/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.8726 - loss: 0.5397 - val_accuracy: 0.5417 - val_loss: 1.3240
Epoch 185/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.8843 - loss: 0.4978 - val_accuracy: 0.5417 - val_loss: 1.3208
Epoch 186/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 32ms/step - accuracy: 0.8564 - loss: 0.5186 - val_accuracy: 0.5417 - val_loss: 1.3221
Epoch 187/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.9043 - loss: 0.4836 - val_accuracy: 0.5000 - val_loss: 1.3141
Epoch 188/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.8314 - loss: 0.5147 - val_accuracy: 0.5417 - val_loss: 1.3281
Epoch 189/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 28ms/step - accuracy: 0.8826 - loss: 0.5266 - val_accuracy: 0.5417 - val_loss: 1.3307
Epoch 190/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.8943 - loss: 0.5007 - val_accuracy: 0.5417 - val_loss: 1.3282
Epoch 191/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.8926 - loss: 0.4872 - val_accuracy: 0.5000 - val_loss: 1.3260
Epoch 192/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 29ms/step - accuracy: 0.8756 - loss: 0.5308 - val_accuracy: 0.5417 - val_loss: 1.3336
Epoch 193/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.9010 - loss: 0.5127 - val_accuracy: 0.5417 - val_loss: 1.3331
Epoch 194/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.9372 - loss: 0.4738 - val_accuracy: 0.5000 - val_loss: 1.3283
Epoch 195/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 33ms/step - accuracy: 0.8820 - loss: 0.4978 - val_accuracy: 0.5417 - val_loss: 1.3303
Epoch 196/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 28ms/step - accuracy: 0.8816 - loss: 0.4886 - val_accuracy: 0.5000 - val_loss: 1.3244
Epoch 197/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 29ms/step - accuracy: 0.8433 - loss: 0.5594 - val_accuracy: 0.5417 - val_loss: 1.3374
Epoch 198/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.9239 - loss: 0.4760 - val_accuracy: 0.5417 - val_loss: 1.3387
Epoch 199/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.8966 - loss: 0.4665 - val_accuracy: 0.5417 - val_loss: 1.3437
Epoch 200/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.9072 - loss: 0.4805 - val_accuracy: 0.5417 - val_loss: 1.3512
Epoch 201/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.8856 - loss: 0.4917 - val_accuracy: 0.5417 - val_loss: 1.3594
Epoch 202/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 28ms/step - accuracy: 0.9329 - loss: 0.4571 - val_accuracy: 0.5000 - val_loss: 1.3544
Epoch 203/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.8956 - loss: 0.4736 - val_accuracy: 0.5417 - val_loss: 1.3687
Epoch 204/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 28ms/step - accuracy: 0.8772 - loss: 0.4964 - val_accuracy: 0.5417 - val_loss: 1.3707
Epoch 205/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.9089 - loss: 0.4725 - val_accuracy: 0.5000 - val_loss: 1.3773
Epoch 206/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 28ms/step - accuracy: 0.8572 - loss: 0.4928 - val_accuracy: 0.5417 - val_loss: 1.3846
Epoch 207/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 29ms/step - accuracy: 0.9279 - loss: 0.4550 - val_accuracy: 0.5417 - val_loss: 1.3950
Epoch 208/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.9362 - loss: 0.4360 - val_accuracy: 0.5417 - val_loss: 1.3862
Epoch 209/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 29ms/step - accuracy: 0.9062 - loss: 0.4616 - val_accuracy: 0.5417 - val_loss: 1.3874
Epoch 210/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 28ms/step - accuracy: 0.8822 - loss: 0.4927 - val_accuracy: 0.5417 - val_loss: 1.3936
Epoch 211/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.9245 - loss: 0.4345 - val_accuracy: 0.5417 - val_loss: 1.3836
Epoch 212/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 31ms/step - accuracy: 0.9056 - loss: 0.4456 - val_accuracy: 0.5417 - val_loss: 1.3927
Epoch 213/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.9262 - loss: 0.4343 - val_accuracy: 0.5417 - val_loss: 1.4020
Epoch 214/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 28ms/step - accuracy: 0.9429 - loss: 0.4178 - val_accuracy: 0.5000 - val_loss: 1.3902
Epoch 215/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.8956 - loss: 0.4403 - val_accuracy: 0.5000 - val_loss: 1.3923
Epoch 216/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.8906 - loss: 0.4537 - val_accuracy: 0.5000 - val_loss: 1.3994
Epoch 217/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 30ms/step - accuracy: 0.8922 - loss: 0.4269 - val_accuracy: 0.5000 - val_loss: 1.3997
Epoch 218/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.9122 - loss: 0.4349 - val_accuracy: 0.5417 - val_loss: 1.4188
Epoch 219/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.8756 - loss: 0.4753 - val_accuracy: 0.5000 - val_loss: 1.4131
Epoch 220/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.9245 - loss: 0.4085 - val_accuracy: 0.5417 - val_loss: 1.4186
Epoch 221/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 31ms/step - accuracy: 0.9062 - loss: 0.4411 - val_accuracy: 0.5417 - val_loss: 1.4305
Epoch 222/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.9379 - loss: 0.4239 - val_accuracy: 0.5417 - val_loss: 1.4283
Epoch 223/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.9045 - loss: 0.4214 - val_accuracy: 0.5000 - val_loss: 1.4268
Epoch 224/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 25ms/step - accuracy: 0.9262 - loss: 0.4191 - val_accuracy: 0.5000 - val_loss: 1.4265
Epoch 225/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 25ms/step - accuracy: 0.9279 - loss: 0.4252 - val_accuracy: 0.4583 - val_loss: 1.4412
Epoch 226/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 25ms/step - accuracy: 0.9335 - loss: 0.4420 - val_accuracy: 0.4583 - val_loss: 1.4444
Epoch 227/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.9202 - loss: 0.4180 - val_accuracy: 0.5417 - val_loss: 1.4634
Epoch 228/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.8962 - loss: 0.4319 - val_accuracy: 0.5417 - val_loss: 1.4736
Epoch 229/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 25ms/step - accuracy: 0.9145 - loss: 0.3975 - val_accuracy: 0.5417 - val_loss: 1.4521
Epoch 230/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 31ms/step - accuracy: 0.9245 - loss: 0.3493 - val_accuracy: 0.5000 - val_loss: 1.4505
Epoch 231/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.9162 - loss: 0.4144 - val_accuracy: 0.5417 - val_loss: 1.4671
Epoch 232/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.8812 - loss: 0.4043 - val_accuracy: 0.5417 - val_loss: 1.4705
Epoch 233/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 28ms/step - accuracy: 0.9329 - loss: 0.3728 - val_accuracy: 0.5000 - val_loss: 1.4710
Epoch 234/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.9385 - loss: 0.3766 - val_accuracy: 0.5000 - val_loss: 1.4728
Epoch 235/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.9162 - loss: 0.3558 - val_accuracy: 0.5000 - val_loss: 1.4818
Epoch 236/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.9102 - loss: 0.3901 - val_accuracy: 0.5417 - val_loss: 1.4971
Epoch 237/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 28ms/step - accuracy: 0.9395 - loss: 0.3715 - val_accuracy: 0.5000 - val_loss: 1.5063
Epoch 238/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.9525 - loss: 0.3502 - val_accuracy: 0.5000 - val_loss: 1.5007
Epoch 239/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.9302 - loss: 0.3950 - val_accuracy: 0.5417 - val_loss: 1.5094
Epoch 240/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.9535 - loss: 0.3423 - val_accuracy: 0.5417 - val_loss: 1.5108
Epoch 241/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.9385 - loss: 0.3503 - val_accuracy: 0.5417 - val_loss: 1.5281
Epoch 242/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 25ms/step - accuracy: 0.9535 - loss: 0.3427 - val_accuracy: 0.5417 - val_loss: 1.5227
Epoch 243/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 28ms/step - accuracy: 0.9029 - loss: 0.3412 - val_accuracy: 0.5000 - val_loss: 1.5108
Epoch 244/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.9402 - loss: 0.3674 - val_accuracy: 0.5417 - val_loss: 1.5253
Epoch 245/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.9345 - loss: 0.3490 - val_accuracy: 0.5000 - val_loss: 1.5232
Epoch 246/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 53ms/step - accuracy: 0.9306 - loss: 0.3507 - val_accuracy: 0.5417 - val_loss: 1.5481
Epoch 247/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 39ms/step - accuracy: 0.9195 - loss: 0.3307 - val_accuracy: 0.5000 - val_loss: 1.5393
Epoch 248/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 45ms/step - accuracy: 0.8862 - loss: 0.3562 - val_accuracy: 0.5000 - val_loss: 1.5598
Epoch 249/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 45ms/step - accuracy: 0.9235 - loss: 0.3615 - val_accuracy: 0.5417 - val_loss: 1.5598
Epoch 250/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 40ms/step - accuracy: 0.9352 - loss: 0.3216 - val_accuracy: 0.5417 - val_loss: 1.5613
Epoch 251/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 45ms/step - accuracy: 0.9141 - loss: 0.3936 - val_accuracy: 0.5417 - val_loss: 1.5746
Epoch 252/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 48ms/step - accuracy: 0.9681 - loss: 0.3164 - val_accuracy: 0.5417 - val_loss: 1.5711
Epoch 253/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 49ms/step - accuracy: 0.9585 - loss: 0.3067 - val_accuracy: 0.5000 - val_loss: 1.5718
Epoch 254/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 37ms/step - accuracy: 0.9291 - loss: 0.3404 - val_accuracy: 0.5417 - val_loss: 1.5752
Epoch 255/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 47ms/step - accuracy: 0.9625 - loss: 0.3237 - val_accuracy: 0.4583 - val_loss: 1.5688
Epoch 256/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 36ms/step - accuracy: 0.9385 - loss: 0.3349 - val_accuracy: 0.4583 - val_loss: 1.5781
Epoch 257/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 46ms/step - accuracy: 0.9741 - loss: 0.2887 - val_accuracy: 0.4583 - val_loss: 1.5776
Epoch 258/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 40ms/step - accuracy: 0.9641 - loss: 0.3096 - val_accuracy: 0.4583 - val_loss: 1.5849
Epoch 259/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 39ms/step - accuracy: 0.9085 - loss: 0.3653 - val_accuracy: 0.5000 - val_loss: 1.5906
Epoch 260/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 37ms/step - accuracy: 0.9235 - loss: 0.3249 - val_accuracy: 0.4583 - val_loss: 1.6062
Epoch 261/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 42ms/step - accuracy: 0.9531 - loss: 0.3222 - val_accuracy: 0.5000 - val_loss: 1.6126
Epoch 262/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 34ms/step - accuracy: 0.9631 - loss: 0.3054 - val_accuracy: 0.5000 - val_loss: 1.6118
Epoch 263/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.9491 - loss: 0.3015 - val_accuracy: 0.5000 - val_loss: 1.6156
Epoch 264/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 28ms/step - accuracy: 0.9708 - loss: 0.3059 - val_accuracy: 0.4583 - val_loss: 1.6222
Epoch 265/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.9621 - loss: 0.2908 - val_accuracy: 0.5000 - val_loss: 1.6331
Epoch 266/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.9564 - loss: 0.3132 - val_accuracy: 0.4583 - val_loss: 1.6384
Epoch 267/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 31ms/step - accuracy: 0.9281 - loss: 0.3247 - val_accuracy: 0.4583 - val_loss: 1.6469
Epoch 268/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 29ms/step - accuracy: 0.9854 - loss: 0.2632 - val_accuracy: 0.4583 - val_loss: 1.6473
Epoch 269/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.9771 - loss: 0.2822 - val_accuracy: 0.4583 - val_loss: 1.6575
Epoch 270/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.9381 - loss: 0.2891 - val_accuracy: 0.5417 - val_loss: 1.6809
Epoch 271/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.9581 - loss: 0.2846 - val_accuracy: 0.4583 - val_loss: 1.6671
Epoch 272/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.9771 - loss: 0.2865 - val_accuracy: 0.4583 - val_loss: 1.6783
Epoch 273/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.9671 - loss: 0.2861 - val_accuracy: 0.5000 - val_loss: 1.6919
Epoch 274/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.9671 - loss: 0.3108 - val_accuracy: 0.5000 - val_loss: 1.6899
Epoch 275/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.9671 - loss: 0.2948 - val_accuracy: 0.4583 - val_loss: 1.6900
Epoch 276/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 30ms/step - accuracy: 0.9771 - loss: 0.2946 - val_accuracy: 0.5000 - val_loss: 1.7088
Epoch 277/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.9854 - loss: 0.2607 - val_accuracy: 0.4583 - val_loss: 1.7044
Epoch 278/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.9671 - loss: 0.2837 - val_accuracy: 0.5000 - val_loss: 1.7132
Epoch 279/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.9771 - loss: 0.2824 - val_accuracy: 0.5000 - val_loss: 1.7119
Epoch 280/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.9860 - loss: 0.2670 - val_accuracy: 0.4583 - val_loss: 1.7204
Epoch 281/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.9910 - loss: 0.2806 - val_accuracy: 0.4583 - val_loss: 1.7227
Epoch 282/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 25ms/step - accuracy: 0.9760 - loss: 0.2638 - val_accuracy: 0.5000 - val_loss: 1.7422
Epoch 283/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.9860 - loss: 0.2589 - val_accuracy: 0.4583 - val_loss: 1.7458
Epoch 284/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.9671 - loss: 0.2849 - val_accuracy: 0.5000 - val_loss: 1.7509
Epoch 285/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 31ms/step - accuracy: 0.9821 - loss: 0.2390 - val_accuracy: 0.5000 - val_loss: 1.7797
Epoch 286/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.9910 - loss: 0.2631 - val_accuracy: 0.5000 - val_loss: 1.7620
Epoch 287/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.9760 - loss: 0.2678 - val_accuracy: 0.5000 - val_loss: 1.7690
Epoch 288/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.9944 - loss: 0.2304 - val_accuracy: 0.4583 - val_loss: 1.7574
Epoch 289/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 25ms/step - accuracy: 0.9910 - loss: 0.2325 - val_accuracy: 0.5000 - val_loss: 1.7773
Epoch 290/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.9860 - loss: 0.2653 - val_accuracy: 0.5000 - val_loss: 1.7805
Epoch 291/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.9944 - loss: 0.2183 - val_accuracy: 0.4583 - val_loss: 1.7748
Epoch 292/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.9860 - loss: 0.2349 - val_accuracy: 0.5000 - val_loss: 1.7954
Epoch 293/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.9944 - loss: 0.2237 - val_accuracy: 0.4583 - val_loss: 1.7909
Epoch 294/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 30ms/step - accuracy: 0.9760 - loss: 0.2469 - val_accuracy: 0.4583 - val_loss: 1.8025
Epoch 295/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 28ms/step - accuracy: 0.9860 - loss: 0.2225 - val_accuracy: 0.5000 - val_loss: 1.8003
Epoch 296/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.9910 - loss: 0.2378 - val_accuracy: 0.5000 - val_loss: 1.8076
Epoch 297/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 25ms/step - accuracy: 0.9910 - loss: 0.2239 - val_accuracy: 0.5000 - val_loss: 1.8099
Epoch 298/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.9944 - loss: 0.2239 - val_accuracy: 0.4583 - val_loss: 1.7990
Epoch 299/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 28ms/step - accuracy: 0.9910 - loss: 0.2120 - val_accuracy: 0.4583 - val_loss: 1.8244
Epoch 300/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 28ms/step - accuracy: 0.9760 - loss: 0.2508 - val_accuracy: 0.4583 - val_loss: 1.8384

## Your code to plot training and validation curves in a single plot (Make changes in the model cell to be able to do this) : TODO
fig, axes = plt.subplots(1, 2, figsize=(14, 5))

# --- Loss curves ---
axes[0].plot(history.history['loss'], label='Train Loss', color='steelblue')
axes[0].plot(history.history['val_loss'], label='Validation Loss',
  color='tomato', linestyle='--')
axes[0].set_title('Training vs Validation Loss', fontweight='bold')
axes[0].set_xlabel('Epoch')
axes[0].set_ylabel('Loss')
axes[0].legend()

# --- Accuracy curves ---
axes[1].plot(history.history['accuracy'], label='Train Accuracy', color='steelblue')
axes[1].plot(history.history['val_accuracy'], label='Validation, Accuracy', color='tomato', linestyle='--')
axes[1].set_title('Training vs Validation Accuracy', fontweight='bold')
axes[1].set_xlabel('Epoch')
axes[1].set_ylabel('Accuracy')
axes[1].legend()

plt.suptitle('Training Curves', fontsize=14, fontweight='bold')
plt.tight_layout()
plt.show()

# Generate predicted y values
prediction_column_index = np.argmax(keras_model.predict(X_test_nn),
  axis=1)

# Extract correct prediction labels
category_order = ['Very Low', 'Low', 'Average', 'High', 'Very High']
prediction_labels = [category_order[i] for i in prediction_column_index]

# True labels for X_test
true_labels = [category_order[i] for i in y_test_cat.codes]

# Model performance
from sklearn.metrics import classification_report, confusion_matrix, accuracy_score

print("Keras Neural Network — Test Set Performance")
print(f"Accuracy: {accuracy_score(true_labels,
  prediction_labels):.4f}\n")
print(classification_report(true_labels, prediction_labels,
  target_names=category_order))

# Confusion matrix
cm = confusion_matrix(true_labels, prediction_labels,
  labels=category_order)
plt.figure(figsize=(7, 5))
sns.heatmap(cm, annot=True, fmt='d', cmap='Blues',
              xticklabels=category_order, yticklabels=category_order)
plt.title('Confusion Matrix — Keras Neural Network', fontweight='bold')
plt.ylabel('True Label')
plt.xlabel('Predicted Label')
plt.tight_layout()
plt.show()

2/2 ━━━━━━━━━━━━━━━━━━━━ 0s 134ms/step
Keras Neural Network — Test Set Performance
Accuracy: 0.6429

              precision    recall  f1-score   support

    Very Low       0.71      0.62      0.67         8
         Low       0.60      0.75      0.67         8
     Average       0.50      0.62      0.56         8
        High       1.00      0.67      0.80         9
   Very High       0.56      0.56      0.56         9

    accuracy                           0.64        42
   macro avg       0.67      0.64      0.65        42
weighted avg       0.68      0.64      0.65        42

# Write your lines of code here: TODO

from keras.layers import Dense, Dropout, BatchNormalization, Input
from keras.models import Sequential
from keras.callbacks import EarlyStopping

# Regularized model: Batch Normalization + Dropout after each hidden
# layer
keras_model_reg = Sequential([
    Input(shape=(feature_count,)), # Add Input layer to specify input shape
    Dense(128, activation='relu'),
    BatchNormalization(),
    Dropout(0.3),

    Dense(64, activation='relu'),
    BatchNormalization(),
    Dropout(0.3),

    Dense(64, activation='relu'),
    BatchNormalization(),
    Dropout(0.3),

    Dense(32, activation='relu'),
    BatchNormalization(),
    Dropout(0.2),

    Dense(5, activation='softmax')
])

keras_model_reg.compile(loss='categorical_crossentropy',
  optimizer='adam', metrics=['accuracy'])

early_stop = EarlyStopping(monitor='val_loss', patience=20,
  restore_best_weights=True)

history_reg = keras_model_reg.fit(
    X_train_nn, y_train_ohe,
    batch_size=20,
    epochs=300,
    validation_split=0.25,
    callbacks=[early_stop],
    verbose=1
)

# --- Compare training curves: before vs after regularization ---
fig, axes = plt.subplots(2, 2, figsize=(14, 10))

# Loss — original
axes[0,0].plot(history.history['loss'],     label='Train',
  color='steelblue')
axes[0,0].plot(history.history['val_loss'], label='Validation',
  color='tomato', linestyle='--')
axes[0,0].set_title('Loss — No Regularization', fontweight='bold')
axes[0,0].set_xlabel('Epoch')
axes[0,0].set_ylabel('Loss')
axes[0,0].legend()

# Loss — regularized
axes[0,1].plot(history_reg.history['loss'],     label='Train',
  color='steelblue')
axes[0,1].plot(history_reg.history['val_loss'], label='Validation',
  color='tomato', linestyle='--')
axes[0,1].set_title('Loss — With Regularization (Dropout + BN)',
  fontweight='bold')
axes[0,1].set_xlabel('Epoch')
axes[0,1].set_ylabel('Loss')
axes[0,1].legend()

# Accuracy — original
axes[1,0].plot(history.history['accuracy'],     label='Train',
  color='steelblue')
axes[1,0].plot(history.history['val_accuracy'], label='Validation',
  color='tomato', linestyle='--')
axes[1,0].set_title('Accuracy — No Regularization', fontweight='bold')
axes[1,0].set_xlabel('Epoch')
axes[1,0].set_ylabel('Accuracy')
axes[1,0].legend()

# Accuracy — regularized
axes[1,1].plot(history_reg.history['accuracy'],     label='Train',
  color='steelblue')
axes[1,1].plot(history_reg.history['val_accuracy'], label='Validation',
  color='tomato', linestyle='--')
axes[1,1].set_title('Accuracy — With Regularization (Dropout + BN)',
  fontweight='bold')
axes[1,1].set_xlabel('Epoch')
axes[1,1].set_ylabel('Accuracy')
axes[1,1].legend()

plt.suptitle('Before vs After Regularization', fontsize=14,
  fontweight='bold')
plt.tight_layout()
plt.show()

# --- Numeric comparison ---
pred_reg_idx    = np.argmax(keras_model_reg.predict(X_test_nn), axis=1)
pred_reg_labels = [category_order[i] for i in pred_reg_idx]

print("=== Before Regularization ===")
print(f"Test Accuracy:  {accuracy_score(true_labels,
  prediction_labels):.4f}")

print("\n=== After Regularization ===")
print(f"Test Accuracy:  {accuracy_score(true_labels,
  pred_reg_labels):.4f}")
print(f"Stopped at epoch: {len(history_reg.history['loss'])}")
print("\n", classification_report(true_labels, pred_reg_labels,
  target_names=category_order))

Epoch 1/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 5s 137ms/step - accuracy: 0.1772 - loss: 2.5328 - val_accuracy: 0.1667 - val_loss: 1.6303
Epoch 2/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 42ms/step - accuracy: 0.1636 - loss: 2.0706 - val_accuracy: 0.1667 - val_loss: 1.6147
Epoch 3/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 30ms/step - accuracy: 0.3162 - loss: 1.9698 - val_accuracy: 0.1667 - val_loss: 1.6009
Epoch 4/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 30ms/step - accuracy: 0.3300 - loss: 1.8115 - val_accuracy: 0.2083 - val_loss: 1.5870
Epoch 5/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 29ms/step - accuracy: 0.2706 - loss: 1.7498 - val_accuracy: 0.2917 - val_loss: 1.5733
Epoch 6/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 29ms/step - accuracy: 0.3748 - loss: 1.7640 - val_accuracy: 0.3333 - val_loss: 1.5597
Epoch 7/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 30ms/step - accuracy: 0.3000 - loss: 1.5794 - val_accuracy: 0.2917 - val_loss: 1.5503
Epoch 8/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 28ms/step - accuracy: 0.3688 - loss: 1.4783 - val_accuracy: 0.3750 - val_loss: 1.5398
Epoch 9/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 30ms/step - accuracy: 0.4048 - loss: 1.4046 - val_accuracy: 0.3750 - val_loss: 1.5274
Epoch 10/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 30ms/step - accuracy: 0.5245 - loss: 1.2671 - val_accuracy: 0.3750 - val_loss: 1.5164
Epoch 11/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 31ms/step - accuracy: 0.3481 - loss: 1.5022 - val_accuracy: 0.2917 - val_loss: 1.5054
Epoch 12/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 30ms/step - accuracy: 0.4928 - loss: 1.2245 - val_accuracy: 0.2917 - val_loss: 1.4966
Epoch 13/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 29ms/step - accuracy: 0.3940 - loss: 1.4716 - val_accuracy: 0.2917 - val_loss: 1.4877
Epoch 14/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 29ms/step - accuracy: 0.5541 - loss: 1.1124 - val_accuracy: 0.2917 - val_loss: 1.4766
Epoch 15/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 30ms/step - accuracy: 0.4949 - loss: 1.5085 - val_accuracy: 0.3333 - val_loss: 1.4693
Epoch 16/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 30ms/step - accuracy: 0.4446 - loss: 1.2516 - val_accuracy: 0.3333 - val_loss: 1.4575
Epoch 17/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 29ms/step - accuracy: 0.4842 - loss: 1.1470 - val_accuracy: 0.2917 - val_loss: 1.4497
Epoch 18/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 30ms/step - accuracy: 0.3015 - loss: 1.2951 - val_accuracy: 0.2917 - val_loss: 1.4406
Epoch 19/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 34ms/step - accuracy: 0.4985 - loss: 1.2214 - val_accuracy: 0.2917 - val_loss: 1.4316
Epoch 20/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 29ms/step - accuracy: 0.4559 - loss: 1.1525 - val_accuracy: 0.2917 - val_loss: 1.4270
Epoch 21/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 29ms/step - accuracy: 0.5769 - loss: 1.1646 - val_accuracy: 0.2917 - val_loss: 1.4240
Epoch 22/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 30ms/step - accuracy: 0.5729 - loss: 1.1404 - val_accuracy: 0.3750 - val_loss: 1.4193
Epoch 23/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 28ms/step - accuracy: 0.4855 - loss: 1.2405 - val_accuracy: 0.3750 - val_loss: 1.4167
Epoch 24/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 29ms/step - accuracy: 0.5946 - loss: 0.9285 - val_accuracy: 0.4167 - val_loss: 1.4126
Epoch 25/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 30ms/step - accuracy: 0.5500 - loss: 0.9713 - val_accuracy: 0.4167 - val_loss: 1.4105
Epoch 26/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 31ms/step - accuracy: 0.6519 - loss: 1.0101 - val_accuracy: 0.4167 - val_loss: 1.4082
Epoch 27/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 44ms/step - accuracy: 0.5274 - loss: 1.1018 - val_accuracy: 0.4167 - val_loss: 1.4044
Epoch 28/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 31ms/step - accuracy: 0.4463 - loss: 0.9825 - val_accuracy: 0.3750 - val_loss: 1.3976
Epoch 29/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 30ms/step - accuracy: 0.6419 - loss: 0.9365 - val_accuracy: 0.4167 - val_loss: 1.3923
Epoch 30/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 29ms/step - accuracy: 0.5670 - loss: 0.9406 - val_accuracy: 0.4167 - val_loss: 1.3883
Epoch 31/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 28ms/step - accuracy: 0.4962 - loss: 1.0709 - val_accuracy: 0.4583 - val_loss: 1.3822
Epoch 32/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 29ms/step - accuracy: 0.5933 - loss: 1.1068 - val_accuracy: 0.4583 - val_loss: 1.3718
Epoch 33/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 31ms/step - accuracy: 0.6531 - loss: 0.9462 - val_accuracy: 0.4583 - val_loss: 1.3638
Epoch 34/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 35ms/step - accuracy: 0.6861 - loss: 0.9278 - val_accuracy: 0.4583 - val_loss: 1.3567
Epoch 35/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.5291 - loss: 1.1761 - val_accuracy: 0.4167 - val_loss: 1.3516
Epoch 36/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 30ms/step - accuracy: 0.6977 - loss: 0.8691 - val_accuracy: 0.4167 - val_loss: 1.3459
Epoch 37/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 30ms/step - accuracy: 0.6652 - loss: 0.8190 - val_accuracy: 0.4167 - val_loss: 1.3414
Epoch 38/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 29ms/step - accuracy: 0.6938 - loss: 0.9973 - val_accuracy: 0.4167 - val_loss: 1.3408
Epoch 39/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 29ms/step - accuracy: 0.6971 - loss: 0.8297 - val_accuracy: 0.4167 - val_loss: 1.3406
Epoch 40/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.6133 - loss: 0.9976 - val_accuracy: 0.3750 - val_loss: 1.3429
Epoch 41/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 30ms/step - accuracy: 0.6365 - loss: 0.8858 - val_accuracy: 0.3750 - val_loss: 1.3410
Epoch 42/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 34ms/step - accuracy: 0.6907 - loss: 0.7513 - val_accuracy: 0.3750 - val_loss: 1.3446
Epoch 43/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.6492 - loss: 0.8528 - val_accuracy: 0.3750 - val_loss: 1.3458
Epoch 44/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 28ms/step - accuracy: 0.6648 - loss: 0.8196 - val_accuracy: 0.3750 - val_loss: 1.3458
Epoch 45/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.6794 - loss: 0.8226 - val_accuracy: 0.3750 - val_loss: 1.3411
Epoch 46/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 29ms/step - accuracy: 0.6402 - loss: 0.8598 - val_accuracy: 0.3750 - val_loss: 1.3391
Epoch 47/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.6765 - loss: 0.8273 - val_accuracy: 0.3750 - val_loss: 1.3397
Epoch 48/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 30ms/step - accuracy: 0.7613 - loss: 0.7018 - val_accuracy: 0.3333 - val_loss: 1.3384
Epoch 49/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 31ms/step - accuracy: 0.7696 - loss: 0.6982 - val_accuracy: 0.3333 - val_loss: 1.3330
Epoch 50/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 41ms/step - accuracy: 0.7304 - loss: 0.6737 - val_accuracy: 0.3750 - val_loss: 1.3271
Epoch 51/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 29ms/step - accuracy: 0.6273 - loss: 0.8331 - val_accuracy: 0.4167 - val_loss: 1.3273
Epoch 52/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 29ms/step - accuracy: 0.6056 - loss: 0.8628 - val_accuracy: 0.4583 - val_loss: 1.3262
Epoch 53/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 29ms/step - accuracy: 0.7084 - loss: 0.7564 - val_accuracy: 0.3750 - val_loss: 1.3280
Epoch 54/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 28ms/step - accuracy: 0.6496 - loss: 0.8128 - val_accuracy: 0.3750 - val_loss: 1.3338
Epoch 55/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 29ms/step - accuracy: 0.7100 - loss: 0.6737 - val_accuracy: 0.3750 - val_loss: 1.3369
Epoch 56/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 27ms/step - accuracy: 0.7011 - loss: 0.8137 - val_accuracy: 0.3750 - val_loss: 1.3391
Epoch 57/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 29ms/step - accuracy: 0.5864 - loss: 0.8873 - val_accuracy: 0.3750 - val_loss: 1.3450
Epoch 58/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 28ms/step - accuracy: 0.7736 - loss: 0.6911 - val_accuracy: 0.3750 - val_loss: 1.3519
Epoch 59/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 51ms/step - accuracy: 0.7096 - loss: 0.8004 - val_accuracy: 0.3333 - val_loss: 1.3562
Epoch 60/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 51ms/step - accuracy: 0.7586 - loss: 0.6616 - val_accuracy: 0.3333 - val_loss: 1.3580
Epoch 61/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 49ms/step - accuracy: 0.6904 - loss: 0.7342 - val_accuracy: 0.2917 - val_loss: 1.3607
Epoch 62/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 48ms/step - accuracy: 0.7384 - loss: 0.7093 - val_accuracy: 0.3333 - val_loss: 1.3599
Epoch 63/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 38ms/step - accuracy: 0.6985 - loss: 0.8100 - val_accuracy: 0.3750 - val_loss: 1.3633
Epoch 64/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 37ms/step - accuracy: 0.7044 - loss: 0.6311 - val_accuracy: 0.3750 - val_loss: 1.3700
Epoch 65/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 49ms/step - accuracy: 0.6465 - loss: 0.8903 - val_accuracy: 0.3750 - val_loss: 1.3775
Epoch 66/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 43ms/step - accuracy: 0.8005 - loss: 0.5860 - val_accuracy: 0.3750 - val_loss: 1.3825
Epoch 67/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 50ms/step - accuracy: 0.6727 - loss: 0.6632 - val_accuracy: 0.3750 - val_loss: 1.3864
Epoch 68/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 40ms/step - accuracy: 0.7653 - loss: 0.5980 - val_accuracy: 0.3333 - val_loss: 1.3978
Epoch 69/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 47ms/step - accuracy: 0.7423 - loss: 0.6217 - val_accuracy: 0.4167 - val_loss: 1.4075
Epoch 70/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 49ms/step - accuracy: 0.8001 - loss: 0.5922 - val_accuracy: 0.4583 - val_loss: 1.4172
Epoch 71/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 40ms/step - accuracy: 0.7615 - loss: 0.6086 - val_accuracy: 0.4583 - val_loss: 1.4258
Epoch 72/300
4/4 ━━━━━━━━━━━━━━━━━━━━ 0s 42ms/step - accuracy: 0.7832 - loss: 0.5337 - val_accuracy: 0.4583 - val_loss: 1.4331

2/2 ━━━━━━━━━━━━━━━━━━━━ 0s 149ms/step
=== Before Regularization ===
Test Accuracy:  0.6429

=== After Regularization ===
Test Accuracy:  0.6190
Stopped at epoch: 72

               precision    recall  f1-score   support

    Very Low       0.40      0.50      0.44         8
         Low       0.67      0.50      0.57         8
     Average       0.60      0.38      0.46         8
        High       0.89      0.89      0.89         9
   Very High       0.58      0.78      0.67         9

    accuracy                           0.62        42
   macro avg       0.63      0.61      0.61        42
weighted avg       0.63      0.62      0.61        42

from keras.models import Sequential
from keras.layers import Dense, LeakyReLU, Input
from keras.callbacks import EarlyStopping
from sklearn.metrics import accuracy_score
import pandas as pd

def build_model(activation):
    model = Sequential()
    if activation == 'leaky_relu':
        model.add(Input(shape=(feature_count,))) # Added Input layer to fix warning
        model.add(Dense(128))
        model.add(LeakyReLU(negative_slope=0.1))
        model.add(Dense(64))
        model.add(LeakyReLU(negative_slope=0.1))
        model.add(Dense(64))
        model.add(LeakyReLU(negative_slope=0.1))
        model.add(Dense(32))
        model.add(LeakyReLU(negative_slope=0.1))
    else:
        model.add(Input(shape=(feature_count,))) # Added Input layer to fix warning
        model.add(Dense(128, activation=activation))
        model.add(Dense(64,  activation=activation))
        model.add(Dense(64,  activation=activation))
        model.add(Dense(32,  activation=activation))

    model.add(Dense(5, activation='softmax'))
    model.compile(loss='categorical_crossentropy', optimizer='adam', metrics=['accuracy'])
    return model

activations  = ['relu', 'leaky_relu', 'tanh', 'sigmoid']
results      = {}
histories    = {}
early_stop   = EarlyStopping(monitor='val_loss', patience=20, restore_best_weights=True)

for act in activations:
    print(f"\nTraining with activation: {act}")
    model = build_model(act)
    hist  = model.fit(
        X_train_nn, y_train_ohe,
        epochs=300,
        batch_size=20,
        validation_split=0.25,
        callbacks=[early_stop],
        verbose=0
    )
    histories[act] = hist
    pred_idx    = np.argmax(model.predict(X_test_nn), axis=1)
    pred_labels = [category_order[i] for i in pred_idx]
    acc         = accuracy_score(true_labels, pred_labels)
    val_acc     = max(hist.history['val_accuracy'])
    epochs_ran  = len(hist.history['loss'])
    results[act] = {'Test Accuracy': round(acc, 4),
                    'Best Val Accuracy': round(val_acc, 4),
                    'Epochs Run': epochs_ran}
    # Fixed unterminated f-string literal
    print(f"  Test Acc: {acc:.4f} | Best Val Acc: {val_acc:.4f} | Epochs: {epochs_ran}")

# --- Summary table ---
print("\n=== Activation Function Comparison ===")
print(pd.DataFrame(results).T.to_string())

# --- Plot val accuracy curves for all activations ---
fig, axes = plt.subplots(1, 2, figsize=(14, 5))
colors = ['steelblue', 'tomato', 'green', 'purple']

for act, color in zip(activations, colors):
    axes[0].plot(histories[act].history['val_loss'],     label=act, color=color)
    axes[1].plot(histories[act].history['val_accuracy'], label=act, color=color)

axes[0].set_title('Validation Loss by Activation Function', fontweight='bold')
axes[0].set_xlabel('Epoch')
axes[0].set_ylabel('Val Loss')
axes[0].legend()

axes[1].set_title('Validation Accuracy by Activation Function', fontweight='bold')
axes[1].set_xlabel('Epoch')
axes[1].set_ylabel('Val Accuracy')
axes[1].legend()

plt.suptitle('Activation Function Comparison', fontsize=14, fontweight='bold')
plt.tight_layout()
plt.show()

Training with activation: relu
2/2 ━━━━━━━━━━━━━━━━━━━━ 0s 71ms/step
  Test Acc: 0.5952 | Best Val Acc: 0.5417 | Epochs: 35

Training with activation: leaky_relu
2/2 ━━━━━━━━━━━━━━━━━━━━ 0s 107ms/step
  Test Acc: 0.5952 | Best Val Acc: 0.5000 | Epochs: 31

Training with activation: tanh
2/2 ━━━━━━━━━━━━━━━━━━━━ 0s 72ms/step
  Test Acc: 0.6190 | Best Val Acc: 0.5000 | Epochs: 24

Training with activation: sigmoid
2/2 ━━━━━━━━━━━━━━━━━━━━ 0s 85ms/step
  Test Acc: 0.6667 | Best Val Acc: 0.5000 | Epochs: 116

=== Activation Function Comparison ===
            Test Accuracy  Best Val Accuracy  Epochs Run
relu               0.5952             0.5417        35.0
leaky_relu         0.5952             0.5000        31.0
tanh               0.6190             0.5000        24.0
sigmoid            0.6667             0.5000       116.0

import shap
import matplotlib.pyplot as plt

shap.initjs()

# --- SHAP for Random Forest (best classical model) ---
# Get feature names after preprocessing
numeric_feature_names = numeric_features
ohe_feature_names     = preprocess.named_transformers_['cat']['onehot'] \
    .get_feature_names_out(categorical_features).tolist()
all_feature_names     = numeric_feature_names + ohe_feature_names

# Transform test data
X_test_proc = preprocess.transform(X_test)
if hasattr(X_test_proc, 'toarray'):
    X_test_proc = X_test_proc.toarray()

X_test_df = pd.DataFrame(X_test_proc, columns=all_feature_names)

# TreeExplainer — fast and exact for Random Forest (using the best GridSearchCV model)
explainer   = shap.TreeExplainer(gridmodel.best_estimator_)
shap_values = explainer.shap_values(X_test_df)

# --- Summary plot: mean absolute SHAP across all classes ---
plt.figure()
shap.summary_plot(
    shap_values,
    X_test_df,
    plot_type='bar',
    class_names=category_order,
    show=True
)

# --- Handle SHAP version differences ---
# Older SHAP: shap_values is a list of arrays [class_0, class_1, ...]
# Newer SHAP: shap_values is a 3D array (n_samples, n_features, n_classes)
if isinstance(shap_values, list):
    sv_very_high = shap_values[4]
    expected_val = explainer.expected_value[4]
else:
    sv_very_high = shap_values[:, :, 4]
    expected_val = explainer.expected_value[4] if hasattr(explainer.expected_value, '__len__') else explainer.expected_value

# --- Beeswarm plot for 'Very High' class (index 4) ---
plt.figure()
shap.summary_plot(
    sv_very_high,
    X_test_df,
    plot_type='dot',
    show=True
)

# --- Force plot for first test sample ---
shap.force_plot(
    expected_val,
    sv_very_high[0],
    X_test_df.iloc[0],
    matplotlib=True
)

## You are encouraged to try more experimentation and any other models by adding more code cells to this notebook:

## You can also try to import any new dataset pertaining to countries, merge it, and see if it helps the predictions.
## If it does not, try to explain why it wasn't helpful by exploring variable relationships.

#Try additional models and compare all:
from sklearn.svm import SVC
from sklearn.neighbors import KNeighborsClassifier
from sklearn.ensemble import GradientBoostingClassifier, BaggingClassifier
from sklearn.linear_model import LogisticRegression
from sklearn.metrics import accuracy_score, classification_report
import pandas as pd

X_tr = preprocess.transform(X_train)
X_te = preprocess.transform(X_test)
if hasattr(X_tr, 'toarray'):
    X_tr = X_tr.toarray()
    X_te = X_te.toarray()

models = {
    'Random Forest (best)':      gridmodel.best_estimator_,
    'Gradient Boosting':
GradientBoostingClassifier(n_estimators=300, max_depth=4,
learning_rate=0.05, random_state=42),
    'SVM (RBF)':                 SVC(kernel='rbf', C=10, gamma='scale',
random_state=42),
    'KNN (k=5)':                 KNeighborsClassifier(n_neighbors=5,
metric='euclidean'),
    'Bagging':                   BaggingClassifier(n_estimators=200,
random_state=42),
    'Logistic Regression':       LogisticRegression(max_iter=1000,
random_state=42)
}

results = {}
for name, m in models.items():
    m.fit(X_tr, y_train)
    preds      = m.predict(X_te)
    train_acc  = m.score(X_tr, y_train)
    test_acc   = accuracy_score(y_test, preds)
    results[name] = {'Train Accuracy': round(train_acc, 4),
                       'Test Accuracy':  round(test_acc,  4),
                       'Overfit Gap':    round(train_acc - test_acc, 4)}

results_df = pd.DataFrame(results).T.sort_values('Test Accuracy',
ascending=False)
print(results_df.to_string())

# Bar chart comparison
results_df[['Train Accuracy', 'Test Accuracy']].plot(
    kind='bar', figsize=(12, 5), edgecolor='black',
    color=['steelblue', 'tomato'], ylim=(0, 1.05)
)
plt.title('Model Comparison — Train vs Test Accuracy',
fontweight='bold')
plt.xticks(rotation=30, ha='right')
plt.ylabel('Accuracy')
plt.axhline(0.2, linestyle='--', color='grey', label='Random baseline (5 classes)')
plt.legend()
plt.tight_layout()
plt.show()

                      Train Accuracy  Test Accuracy  Overfit Gap
Random Forest (best)          1.0000         0.6190       0.3810
SVM (RBF)                     0.9684         0.5476       0.4208
KNN (k=5)                     0.6421         0.5476       0.0945
Bagging                       1.0000         0.5238       0.4762
Gradient Boosting             1.0000         0.4762       0.5238
Logistic Regression           0.7789         0.4524       0.3266

#Best model: detailed report:
best_model_name = results_df.index[0]
best_model      = models[best_model_name]
best_preds      = best_model.predict(X_te)

print(f"Best model: {best_model_name}")
print(f"Test Accuracy: {accuracy_score(y_test, best_preds):.4f}\n")
print(classification_report(y_test, best_preds,
target_names=category_order))

cm = confusion_matrix(y_test, best_preds, labels=category_order)
plt.figure(figsize=(7, 5))
sns.heatmap(cm, annot=True, fmt='d', cmap='Blues',
            xticklabels=category_order, yticklabels=category_order)
plt.title(f'Confusion Matrix — {best_model_name}', fontweight='bold')
plt.ylabel('True Label')
plt.xlabel('Predicted Label')
plt.tight_layout()
plt.show()

Best model: Random Forest (best)
Test Accuracy: 0.6190

              precision    recall  f1-score   support

    Very Low       0.67      0.75      0.71         8
         Low       0.62      0.62      0.62         8
     Average       0.45      0.62      0.53         8
        High       0.86      0.67      0.75         9
   Very High       0.57      0.44      0.50         9

    accuracy                           0.62        42
   macro avg       0.63      0.62      0.62        42
weighted avg       0.64      0.62      0.62        42

	country	region	happiness_score	gdp_per_capita	social_support	healthy_life_expectancy	freedom_to_make_life_choices	generosity	perceptions_of_corruption
0	Finland	Western Europe	7.804	1.888	1.585	0.535	0.772	0.126	0.535
1	Denmark	Western Europe	7.586	1.949	1.548	0.537	0.734	0.208	0.525
2	Iceland	Western Europe	7.530	1.926	1.620	0.559	0.738	0.250	0.187
3	Israel	Middle East and North Africa	7.473	1.833	1.521	0.577	0.569	0.124	0.158
4	Netherlands	Western Europe	7.403	1.942	1.488	0.545	0.672	0.251	0.394
...	...	...	...	...	...	...	...	...	...
132	Congo (Kinshasa)	Sub-Saharan Africa	3.207	0.531	0.784	0.105	0.375	0.183	0.068
133	Zimbabwe	Sub-Saharan Africa	3.204	0.758	0.881	0.069	0.363	0.112	0.117
134	Sierra Leone	Sub-Saharan Africa	3.138	0.670	0.540	0.092	0.371	0.193	0.051
135	Lebanon	Middle East and North Africa	2.392	1.417	0.476	0.398	0.123	0.061	0.027
136	Afghanistan	South Asia	1.859	0.645	0.000	0.087	0.000	0.093	0.059

	country_name	population	population_below_poverty_line	hdi	life_expectancy	expected_years_of_schooling	mean_years_of_schooling	gni
0	India	1339180127	21.9	0.623559	68.322	11.696590	6.298834	5663.474799
1	Nigeria	190886311	70.0	0.527105	53.057	9.970482	6.000000	5442.901264
2	Mexico	129163276	46.2	0.761683	76.972	13.299090	8.554985	16383.106680
3	Pakistan	197015955	29.5	0.550354	66.365	8.106910	5.089460	5031.173074
4	Bangladesh	164669751	31.5	0.578824	71.985	10.178706	5.241577	3341.490722

	country	region	gdp_per_capita	social_support	healthy_life_expectancy	freedom_to_make_life_choices	generosity	perceptions_of_corruption	population	population_below_poverty_line	hdi	life_expectancy	expected_years_of_schooling	mean_years_of_schooling	gni
0	Madagascar	Sub-Saharan Africa	0.632	0.779	0.178	0.187	0.177	0.134	2.557090e+07	70.7	0.512149	65.515	10.346140	6.145955	1319.699397
1	Mauritania	Sub-Saharan Africa	1.099	0.764	0.244	0.320	0.130	0.195	4.420184e+06	31.0	0.513106	63.239	8.463790	4.266000	3527.264154
2	Mongolia	East Asia	1.379	1.494	0.244	0.425	0.239	0.058	3.075647e+06	21.6	0.734832	69.806	14.845520	9.750000	10449.207270
3	Tajikistan	Commonwealth of Independent States	0.972	1.248	0.291	0.599	0.104	0.292	8.921343e+06	31.5	0.627472	69.582	11.261860	10.355820	2600.585607
4	Ukraine	Central and Eastern Europe	1.358	1.354	0.355	0.551	0.265	0.016	4.422295e+07	24.1	0.743049	71.129	15.306720	11.340000	7361.011228
...	...	...	...	...	...	...	...	...	...	...	...	...	...	...	...
90	South Korea	East Asia	1.853	1.188	0.603	0.446	0.112	0.163	5.098221e+07	12.5	0.900992	82.128	16.587520	12.179211	34540.649270
91	Ethiopia	Sub-Saharan Africa	0.793	1.114	0.250	0.451	0.283	0.101	1.049574e+08	29.6	0.447750	64.602	8.351520	2.580780	1522.954782
92	China	East Asia	1.510	1.249	0.468	0.666	0.115	0.145	1.409517e+09	3.3	0.737681	75.963	13.535750	7.641840	13345.477460
93	Peru	Latin America and Caribbean	1.390	1.153	0.499	0.549	0.073	0.027	3.216548e+07	22.7	0.739749	74.814	13.386340	9.013470	11294.840330
94	Jamaica	Latin America and Caribbean	1.305	1.329	0.411	0.587	0.079	0.039	2.890299e+06	16.5	0.730041	75.820	12.835763	9.638854	8350.023078

	generosity	perceptions_of_corruption	interaction_feature1
0	0.162969	0.125751	0.020494
1	0.122218	0.178146	0.021773
2	0.214305	0.056380	0.012083
3	0.098940	0.256191	0.025348
4	0.235072	0.015873	0.003731

	generosity	perceptions_of_corruption	interaction_feature1
0	0.127513	0.138892	0.017711
1	0.062975	0.035367	0.002227
2	0.130151	0.152721	0.019877
3	0.149282	0.175633	0.026219
4	0.098940	0.131905	0.013051

	Missing Values	Percentage (%)
population_below_poverty_line	16	16.842105
mean_years_of_schooling	7	7.368421
expected_years_of_schooling	7	7.368421
life_expectancy	7	7.368421
gni	7	7.368421
population	6	6.315789
hdi	6	6.315789

	Missing Values	Percentage (%)
gni	3	7.142857
expected_years_of_schooling	3	7.142857
mean_years_of_schooling	3	7.142857
life_expectancy	3	7.142857
hdi	3	7.142857
population_below_poverty_line	3	7.142857
population	3	7.142857
healthy_life_expectancy	1	2.380952

	Count	Percentage (%)
perceptions_of_corruption	10.0	10.53
population	9.0	9.47
population_below_poverty_line	4.0	4.21
freedom_to_make_life_choices	3.0	3.16
social_support	2.0	2.11
gni	2.0	2.11
generosity	1.0	1.05
gdp_per_capita	1.0	1.05

	Row_Index	Feature	Value	Z-Score
3	46	healthy_life_expectancy	0.314	3.704516
1	30	social_support	0.0	3.582977
0	30	region	South Asia	3.508821
4	81	country	Venezuela	3.171483
2	45	freedom_to_make_life_choices	0.66	3.138927

Change	Original	Updated	Reason
Numeric imputation	`strategy='constant', fill_value=0`	`strategy='mean'`	Filling with 0 is misleading for features like `gdp_per_capita` — zero implies no GDP, which is factually wrong. Mean is a neutral, unbiased fill.
Categorical features	hardcoded `['region', 'sub-region']`	dynamic `select_dtypes`	`sub-region` does not exist in the dataset — hardcoding caused a `KeyError`. Dynamic detection is robust.
`remainder`	`passthrough`	`drop`	Passthrough would have leaked `country` (string) into the output, breaking model fitting.

Name	Type	Fitted?	Contains data?
`preprocessor` (ColumnTransformer)	sklearn object	No	No — just rules
`preprocess`	sklearn object	Yes	Yes — learned parameters
`preprocessor` (function)	Python function	N/A	No — just logic
`preprocessed_data`	NumPy array	N/A	Yes — transformed data

Student Identification & Submission Details¶

Submission Requirements¶

Project Submission Guidelines¶

Submission Due Date: March 9, 2026¶

Expectations¶

World Happiness Classification Competition¶

Project Objectives¶

Project Workflow¶

0. Loading Datasets¶

Conceptual Question¶

Add New Data¶

1. Exploratory Data Analysis and Visualization (EDAV)¶

Describe What You Observe¶

Missing Values Analysis¶

Distribution of Key Numerical Features¶

Distribution of Categorical Variables¶

Feature Correlation Analysis¶

Brief interpretations of correlations and collinearity¶

Interpretation from heatmaps¶

Bivariate Analysis and Relationship Exploration¶

Outlier Detection¶

Observations and General Comments¶

2. Feature Engineering¶

3. Data Preprocessing¶

Explanation¶

Conceptual Question¶

4. Model Training and Saving Artifacts¶

5. Model Evaluation¶

6. Hyperparameter Experimentation¶

Reflection on Hyperparameter Changes¶

Discussion Question¶

Discussion Question¶

7. Basic Deep Learning¶

Discussion Question¶

Discussion Question¶

Discussion Question¶

Plot Training Curves¶

Regularization: Dropout and Batch Normalization¶

Activation Function Experimentation¶

8. Explainability – SHAP Feature Importance¶

Experimentation¶

9. Final Report Submission (GitHub)¶

Instructions¶