In [21]:
from google.colab import drive
drive.mount('/content/drive')
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
Drive already mounted at /content/drive; to attempt to forcibly remount, call drive.mount("/content/drive", force_remount=True).
In [22]:
# path to read from
# Please adjust the path if your file is in a different subfolder within your Google Drive.
path = '/content/drive/MyDrive/Colab Notebooks/AI/classified_deforestation.csv'
# read csv
df = pd.read_csv(path)

Overview and Introduction¶

Deforestation remains one of the most critical environmental crises of our time, directly impacting global carbon emissions, biodiversity loss, and climate change. However, deforestation does not happen in a vacuum; it is driven by a complex web of socioeconomic, demographic, and geographic factors. The purpose of this project is to build a predictive analytical tool capable of classifying a country's deforestation risk based on its socioeconomic profile. By classifying countries into Low Risk (Class 0) and High Risk (Class 1) using probability thresholds established in prior literature, we can help policymakers better allocate resources, monitor vulnerable regions, and understand the hidden drivers behind forest cover loss.

The Dataset

This notebook builds upon a previously cleaned and engineered dataset comprising socioeconomic and environmental metrics for 100+ countries. The dataset comes from the earlier project "Deforestation Data Insights" (found in the repositories of this GitHub account -> rebeca-bc). Because the data has already undergone Exploratory Data Analysis (EDA), missing-value imputation, and feature engineering in a previous phase, this notebook focuses entirely on advanced predictive modeling and algorithmic evaluation.

New Classifiers

While previous iterations of this project established a strong baseline using simple Logistic Classifiers, LDAs, and Decision Trees, this phase scales up the complexity by introducing Ensemble Models, Support Vector Machines, and basic Neural Networks.

To begin, it's useful to run a quick check of the shape, overall structure, and null counts, just to get familiar with the data again.

In [23]:
# sanity check
print("Dataset Shape:", df.shape)
Dataset Shape: (103, 21)
In [24]:
# check for nulls (only the highest count; if the max is 0, no column has missing values)
df.isnull().sum().max()
Out[24]:
0

Data splitting¶

Now, as is critical for any project, the target variable and the features have to be defined and saved in their respective variables (X = features and y = target).

Our y (target variable) will be the Deforestation_Critical column, a binary flag based on a threshold of 0.501% deforestation of a country's land area. This column is dropped from the main df so that X (the features) can be set to the remaining columns.
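As a quick illustration (the target column already exists in the CSV, so this is only a hypothetical sketch with made-up rates, and the strict > comparison is an assumption about how the original flag was derived), a binary target like Deforestation_Critical can be built from a continuous rate like so:

```python
import pandas as pd

# Toy data: hypothetical annual deforestation as % of land area
demo = pd.DataFrame({'deforestation_rate_pct': [0.10, 0.75, 0.501, 1.20]})

# Flag countries strictly above the 0.501% literature threshold as critical
demo['Deforestation_Critical'] = (demo['deforestation_rate_pct'] > 0.501).astype(int)
print(demo['Deforestation_Critical'].tolist())  # [0, 1, 0, 1]
```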

In [25]:
# Separate the target column so the model can't see it among the features
y = df['Deforestation_Critical']
# Define features (X) as all columns except the target 'Deforestation_Critical'
X = df.drop('Deforestation_Critical', axis=1)
# check for data balance
y.value_counts()
Out[25]:
Deforestation_Critical
0    72
1    31
Name: count, dtype: int64

The value_counts() output shows a class imbalance we are already familiar with from the previous project: 72 countries are non-critical (0) and 31 are critical (1), roughly a 70/30 split. While a 70/30 train-test split is a common choice, an 80/20 ratio (test_size=0.2) is deliberately chosen for this analysis because of the small size of the dataset. In small-sample scenarios, particularly those with class imbalance, a larger training volume is critical to ensure the learning algorithm sees enough examples of the minority class (High Risk) to converge accurately. A purely random split could also inadvertently place most of the minority-class samples into the test set, leaving the model with few critical examples to learn from during training.

Because of the class distribution, the split is performed using stratification (stratify=y). This ensures both subsets preserve the exact proportion of Low/High Risk classes, preventing majority-class bias. We then display the shapes of the resulting sets to confirm the splits are correct.

In [26]:
from sklearn.model_selection import train_test_split
# Perform 80/20 train-test split with stratification and random state
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, random_state=42, stratify=y
)

# Display the shapes of the resulting datasets to confirm the split
print(f"Shape of X_train: {X_train.shape}")
print(f"Shape of X_test: {X_test.shape}")
print(f"Shape of y_train: {y_train.shape}")
print(f"Shape of y_test: {y_test.shape}")
Shape of X_train: (82, 20)
Shape of X_test: (21, 20)
Shape of y_train: (82,)
Shape of y_test: (21,)
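As a sanity check, a minimal sketch (using synthetic labels with the same 72/31 balance and a dummy feature; the real X and y behave identically) shows that stratify=y keeps the class ratio nearly identical in both subsets:

```python
import numpy as np
from sklearn.model_selection import train_test_split

y_demo = np.array([0] * 72 + [1] * 31)          # same 72/31 balance as the dataset
X_demo = np.arange(len(y_demo)).reshape(-1, 1)  # dummy single feature
_, _, y_tr_d, y_te_d = train_test_split(
    X_demo, y_demo, test_size=0.2, random_state=42, stratify=y_demo
)
# Class counts stay proportional (~70/30) in both splits
print(np.bincount(y_tr_d), np.bincount(y_te_d))
```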

Ensemble Models¶

Random Forest¶

A Random Forest generates B bootstrap subsets, each considering m features out of the total p, and builds decision trees that are independent of one another. For this model the most important step is hyperparameter tuning: in the case of a random forest, hyperparameters include the number of decision trees in the forest and the number of features considered by each tree when splitting a node.

To find good values for these hyperparameters, the industry standard is GridSearchCV. This tool automatically tests dozens of hyperparameter combinations using k-fold cross-validation, where the training data is divided into k subsets and evaluated iteratively.

Roadmap

  1. Create a "grid": to begin, the param_grid dictionary will contain the hyperparameters and their candidate values so all combinations can be tested. There is no universal recommendation, but the literature does consistently agree on which parameters matter most and which direction to push them for small datasets.
    • Multiple grid search studies find n_estimators=50 to 300 as the practical range [2]
    • Commonly tested values in classification grid searches use max_depth: [3, 5, 7, 10], with shallow depths helping prevent memorization of small training sets; hence we will use 3, 5, and None (to check the default unlimited-depth behavior of RF) [3]
    • Larger min_samples_leaf values reduce overfitting by requiring more samples at each leaf, but because of the small size of our dataset the values will stay small; hence we test [2, 4, 6]
    • max_features will use two options: sqrt (the square root of the total number of features) is the standard recommendation for classification, with log2 as an alternative that further limits variance [3]
In [27]:
grid = {
    'n_estimators': [50, 100, 150, 200, 250, 300],
    'max_depth': [3, 5, None],
    'min_samples_leaf': [2, 4, 6],
    'max_features': ['sqrt', 'log2']
}
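As a quick sanity check on the search budget (not part of the original pipeline), the number of fits GridSearchCV will perform can be counted directly from the grid: every combination is refit once per fold.

```python
from itertools import product

grid = {
    'n_estimators': [50, 100, 150, 200, 250, 300],
    'max_depth': [3, 5, None],
    'min_samples_leaf': [2, 4, 6],
    'max_features': ['sqrt', 'log2'],
}
n_combos = len(list(product(*grid.values())))
print(n_combos)      # 6 * 3 * 3 * 2 = 108 combinations
print(n_combos * 5)  # with cv=5 -> 540 model fits
```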
  2. Set up the Grid Search: here we use the GridSearchCV() function, which creates its own "validation" sets by splitting the training data into (in this case) 5 folds via the cv=5 parameter. Each hyperparameter combination is trained and graded with this cross-validation, and the search then returns the best-scoring combination. Grid search therefore tightens the model's architecture so it fits the unique curves of this specific Deforestation dataset.
    • Feed it a base model
    • For the parameters, pass the grid just created
    • cv = 5 means 5-Fold Cross-Validation
    • return_train_score=True also records the Training Score (the grade the model got on the folds it studied) alongside the validation score from the internal split. Comparing the two lets you detect overfitting during the validation phase
    • scoring='f1': the classes are imbalanced, and the F1 score balances precision and recall instead of rewarding majority-class guessing, so it's a more realistic measure
In [28]:
from sklearn.model_selection import GridSearchCV
from sklearn.ensemble import RandomForestClassifier

# run gridsearch
rf_grid = GridSearchCV(
    RandomForestClassifier(random_state=42),
    grid,
    cv=5,
    scoring='f1',
    return_train_score=True
)
rf_grid.fit(X_train, y_train)
Out[28]:
GridSearchCV(cv=5, estimator=RandomForestClassifier(random_state=42),
             param_grid={'max_depth': [3, 5, None],
                         'max_features': ['sqrt', 'log2'],
                         'min_samples_leaf': [2, 4, 6],
                         'n_estimators': [50, 100, 150, 200, 250, 300]},
             return_train_score=True, scoring='f1')
RandomForestClassifier(max_depth=3, min_samples_leaf=2, random_state=42)

To ensure our optimal model is truly learning the underlying patterns of deforestation rather than simply memorizing the training data, we must extract and analyze the full cv_results_ from our Grid Search. The following table aggregates the performance metrics of all tested hyperparameter combinations across the 5 cross-validation folds. By comparing the Training F1-Score (mean_train_score) against the Validation F1-Score (mean_test_score), we can monitor for variance and overfitting. Furthermore, the Standard Deviation (std_test_score) allows us to verify the stability of the model across different data distributions, ensuring that our final model generalizes to real data.

In [29]:
# see combinations and their scores; first transform to a df
results = pd.DataFrame(rf_grid.cv_results_)

table = results[[
    'param_n_estimators',
    'param_max_depth',
    'param_min_samples_leaf',
    'param_max_features',
    'mean_train_score',      # score on train portion
    'mean_test_score',       # score on validation portion
    'std_test_score'         # stable?
]].sort_values('mean_test_score', ascending=False)

print(table.to_string())
     param_n_estimators param_max_depth  param_min_samples_leaf param_max_features  mean_train_score  mean_test_score  std_test_score
1                   100               3                       2               sqrt          0.900585         0.626667        0.180308
19                  100               3                       2               log2          0.900585         0.626667        0.180308
20                  150               3                       2               log2          0.881164         0.583333        0.149071
2                   150               3                       2               sqrt          0.881164         0.583333        0.149071
38                  150               5                       2               sqrt          0.968399         0.583333        0.149071
37                  100               5                       2               sqrt          0.974359         0.583333        0.149071
91                  100            None                       2               log2          0.979487         0.583333        0.149071
92                  150            None                       2               log2          0.979217         0.583333        0.149071
73                  100            None                       2               sqrt          0.979487         0.583333        0.149071
74                  150            None                       2               sqrt          0.979217         0.583333        0.149071
55                  100               5                       2               log2          0.974359         0.583333        0.149071
56                  150               5                       2               log2          0.968399         0.583333        0.149071
0                    50               3                       2               sqrt          0.894552         0.580000        0.157198
18                   50               3                       2               log2          0.894552         0.580000        0.157198
41                  300               5                       2               sqrt          0.984615         0.566667        0.133333
48                   50               5                       6               sqrt          0.814335         0.566667        0.133333
95                  300            None                       2               log2          0.994872         0.566667        0.133333
102                  50            None                       6               log2          0.814335         0.566667        0.133333
84                   50            None                       6               sqrt          0.814335         0.566667        0.133333
77                  300            None                       2               sqrt          0.994872         0.566667        0.133333
66                   50               5                       6               log2          0.814335         0.566667        0.133333
24                   50               3                       4               log2          0.842151         0.566667        0.133333
30                   50               3                       6               log2          0.814335         0.566667        0.133333
59                  300               5                       2               log2          0.984615         0.566667        0.133333
12                   50               3                       6               sqrt          0.814335         0.566667        0.133333
6                    50               3                       4               sqrt          0.842151         0.566667        0.133333
96                   50            None                       4               log2          0.875006         0.553333        0.125786
42                   50               5                       4               sqrt          0.875006         0.553333        0.125786
60                   50               5                       4               log2          0.875006         0.553333        0.125786
78                   50            None                       4               sqrt          0.875006         0.553333        0.125786
9                   200               3                       4               sqrt          0.838495         0.550000        0.145297
8                   150               3                       4               sqrt          0.837315         0.550000        0.145297
7                   100               3                       4               sqrt          0.851860         0.550000        0.145297
5                   300               3                       2               sqrt          0.881164         0.550000        0.145297
4                   250               3                       2               sqrt          0.887513         0.550000        0.145297
3                   200               3                       2               sqrt          0.887886         0.550000        0.145297
11                  300               3                       4               sqrt          0.833390         0.550000        0.145297
10                  250               3                       4               sqrt          0.838195         0.550000        0.145297
22                  250               3                       2               log2          0.887513         0.550000        0.145297
16                  250               3                       6               sqrt          0.792695         0.550000        0.145297
23                  300               3                       2               log2          0.881164         0.550000        0.145297
15                  200               3                       6               sqrt          0.797457         0.550000        0.145297
17                  300               3                       6               sqrt          0.800650         0.550000        0.145297
14                  150               3                       6               sqrt          0.807316         0.550000        0.145297
106                 250            None                       6               log2          0.799362         0.550000        0.145297
105                 200            None                       6               log2          0.803806         0.550000        0.145297
107                 300            None                       6               log2          0.800650         0.550000        0.145297
104                 150            None                       6               log2          0.807316         0.550000        0.145297
99                  200            None                       4               log2          0.864195         0.550000        0.145297
34                  250               3                       6               log2          0.792695         0.550000        0.145297
35                  300               3                       6               log2          0.800650         0.550000        0.145297
33                  200               3                       6               log2          0.797457         0.550000        0.145297
32                  150               3                       6               log2          0.807316         0.550000        0.145297
29                  300               3                       4               log2          0.833390         0.550000        0.145297
28                  250               3                       4               log2          0.838195         0.550000        0.145297
21                  200               3                       2               log2          0.887886         0.550000        0.145297
26                  150               3                       4               log2          0.837315         0.550000        0.145297
25                  100               3                       4               log2          0.851860         0.550000        0.145297
27                  200               3                       4               log2          0.838495         0.550000        0.145297
43                  100               5                       4               sqrt          0.875838         0.550000        0.145297
71                  300               5                       6               log2          0.800650         0.550000        0.145297
70                  250               5                       6               log2          0.799362         0.550000        0.145297
68                  150               5                       6               log2          0.807316         0.550000        0.145297
69                  200               5                       6               log2          0.803806         0.550000        0.145297
63                  200               5                       4               log2          0.864195         0.550000        0.145297
64                  250               5                       4               log2          0.864195         0.550000        0.145297
61                  100               5                       4               log2          0.875838         0.550000        0.145297
89                  300            None                       6               sqrt          0.800650         0.550000        0.145297
53                  300               5                       6               sqrt          0.800650         0.550000        0.145297
52                  250               5                       6               sqrt          0.799362         0.550000        0.145297
50                  150               5                       6               sqrt          0.807316         0.550000        0.145297
65                  300               5                       4               log2          0.864195         0.550000        0.145297
51                  200               5                       6               sqrt          0.803806         0.550000        0.145297
45                  200               5                       4               sqrt          0.864195         0.550000        0.145297
47                  300               5                       4               sqrt          0.864195         0.550000        0.145297
46                  250               5                       4               sqrt          0.864195         0.550000        0.145297
83                  300            None                       4               sqrt          0.864195         0.550000        0.145297
88                  250            None                       6               sqrt          0.799362         0.550000        0.145297
87                  200            None                       6               sqrt          0.803806         0.550000        0.145297
86                  150            None                       6               sqrt          0.807316         0.550000        0.145297
79                  100            None                       4               sqrt          0.875838         0.550000        0.145297
101                 300            None                       4               log2          0.864195         0.550000        0.145297
100                 250            None                       4               log2          0.864195         0.550000        0.145297
97                  100            None                       4               log2          0.875838         0.550000        0.145297
81                  200            None                       4               sqrt          0.864195         0.550000        0.145297
82                  250            None                       4               sqrt          0.864195         0.550000        0.145297
98                  150            None                       4               log2          0.857528         0.533333        0.124722
31                  100               3                       6               log2          0.821862         0.533333        0.124722
13                  100               3                       6               sqrt          0.821862         0.533333        0.124722
40                  250               5                       2               sqrt          0.979487         0.533333        0.124722
39                  200               5                       2               sqrt          0.973527         0.533333        0.124722
44                  150               5                       4               sqrt          0.857528         0.533333        0.124722
93                  200            None                       2               log2          0.989744         0.533333        0.124722
85                  100            None                       6               sqrt          0.839279         0.533333        0.124722
62                  150               5                       4               log2          0.857528         0.533333        0.124722
75                  200            None                       2               sqrt          0.989744         0.533333        0.124722
49                  100               5                       6               sqrt          0.839279         0.533333        0.124722
57                  200               5                       2               log2          0.973527         0.533333        0.124722
58                  250               5                       2               log2          0.979487         0.533333        0.124722
67                  100               5                       6               log2          0.839279         0.533333        0.124722
103                 100            None                       6               log2          0.839279         0.533333        0.124722
94                  250            None                       2               log2          0.989744         0.533333        0.124722
76                  250            None                       2               sqrt          0.989744         0.533333        0.124722
80                  150            None                       4               sqrt          0.857528         0.533333        0.124722
36                   50               5                       2               sqrt          0.989744         0.529091        0.112597
54                   50               5                       2               log2          0.989744         0.529091        0.112597
72                   50            None                       2               sqrt          0.989744         0.529091        0.112597
90                   50            None                       2               log2          0.989744         0.529091        0.112597

Analysis

  1. The validation scores across the top configurations remain tightly clustered (ranging from roughly 0.53 to 0.63). While the standard deviations (~0.11 to ~0.18) highlight the normal volatility of evaluating on extremely small validation folds, the consistency of the top-ranking parameters shows that the model is systematically finding the same underlying decision boundaries, supporting the reliability of our cross-validation strategy.
  2. As expected with a small dataset (103 total instances), highly complex models aggressively overfit the training data. For example, configurations allowing unlimited tree depth (max_depth=None) achieved almost perfect Training F1-Scores (close to 0.99) but suffered poor Validation F1-Scores (close to 0.56). This indicates that deep trees are memorizing noise rather than learning patterns that can generalize.
  3. Restricting depth helps (regularization): the best configuration combats this overfitting by constraining tree growth. The highest-performing model restricted the trees to a shallow depth (max_depth=3). By forcing the model to remain simple, the Training F1-Score decreased to 0.90, but the Validation F1-Score improved to its maximum of approximately 0.63, proving that shallower trees generalize much better for our deforestation thresholds.
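The natural next step after a search like this is to score the refit best_estimator_ on the untouched test set. Below is a minimal self-contained sketch of that pattern on synthetic data shaped like ours (make_classification, its weights, and the deliberately tiny grid are stand-ins, not the real features or search):

```python
from sklearn.datasets import make_classification
from sklearn.ensemble import RandomForestClassifier
from sklearn.metrics import f1_score
from sklearn.model_selection import GridSearchCV, train_test_split

# Synthetic stand-in: 103 rows, 20 features, ~70/30 class balance
X_d, y_d = make_classification(n_samples=103, n_features=20,
                               weights=[0.7, 0.3], random_state=42)
X_tr, X_te, y_tr, y_te = train_test_split(
    X_d, y_d, test_size=0.2, random_state=42, stratify=y_d
)
search = GridSearchCV(RandomForestClassifier(random_state=42),
                      {'max_depth': [3, None]}, cv=5, scoring='f1')
search.fit(X_tr, y_tr)
# best_estimator_ has already been refit on the full training split
test_f1 = f1_score(y_te, search.best_estimator_.predict(X_te))
print(round(test_f1, 3))
```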

Boosting¶

So, a Random Forest (bagging) model builds deep trees completely independently of one another, and they all vote at the end. Boosting is a sequential approach where each tree learns from the mistakes of the previous one: instead of building independent trees in parallel, it builds them one by one. To explore this, XGBoost will be used next. Boosting helps model complex interacting socioeconomic factors rather than just averaged results. Because our dataset exhibits class imbalance, this sequential focus on "hard-to-predict" observations naturally forces the model to pay closer attention to the minority class (High-Risk countries).
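To make the sequential idea concrete, a small sketch on synthetic data (using scikit-learn's GradientBoostingClassifier as a stand-in for XGBoost) inspects the ensemble after each added tree via staged_predict, showing later trees correcting the earlier trees' training mistakes:

```python
from sklearn.datasets import make_classification
from sklearn.ensemble import GradientBoostingClassifier
from sklearn.metrics import accuracy_score

X_d, y_d = make_classification(n_samples=200, random_state=0)
gb = GradientBoostingClassifier(n_estimators=50, random_state=0).fit(X_d, y_d)

# Training error after each boosting stage (1 tree, 2 trees, ..., 50 trees)
errors = [1 - accuracy_score(y_d, pred) for pred in gb.staged_predict(X_d)]
print(errors[0], errors[-1])  # the full ensemble fits the training data at least as well
```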

XGBoost will follow the exact same GridSearchCV procedure, utilizing 5-Fold Stratified Cross-Validation and its own specific parameter tuning. Hence, it's imperative to first define the grid to feed the model.

  • n_estimators will use a similar range to avoid overfitting and follow literature standards: [50, 100, 150, 200]
  • learning_rate controls how aggressively each new tree corrects past mistakes; low rates are safer but slower, so a mix of low and moderate values is a good start: [0.01, 0.05, 0.1]
  • max_depth: earlier results showed that deeper trees cause more overfitting, and letting trees grow without limit goes wrong on small datasets; because boosting builds trees sequentially rather than in parallel, the values will be [3, 4, 5] (dropping None to avoid slow, overfit-prone fits)
  • colsample_bytree is the fraction of features sampled per tree; to test both a Random-Forest-style model and an unrestricted one, we feed 0.5 (half the features) and 1.0 (all of them)
  • reg_lambda is the L2 regularization strength; we compare the default penalty (1) against a slightly stronger one (2) to see the difference
In [30]:
boosting_grid = {
    'n_estimators':      [50, 100, 150, 200],
    'learning_rate':     [0.01, 0.05, 0.1],
    'max_depth':         [3, 4, 5],
    'colsample_bytree':  [0.5, 1],
    'reg_lambda':        [1, 2],
}

We configure GridSearchCV with the following parameters to ensure a rigorous and fair evaluation:

  • cv=5 (Internal Validation): Uses 5-Fold Cross-Validation to evaluate performance safely without leaking the Test Set.

  • eval_metric='logloss': Strictly penalizes confident but incorrect predictions, forcing the model to calibrate its probabilities.

  • scoring='f1': Prioritizes the balance of Precision and Recall to properly handle our class imbalance.

  • return_train_score=True: Saves the training fold scores so we can manually check for overfitting later.

  • n_jobs=-1: Utilizes all available CPU cores to maximize training speed.

In [31]:
from xgboost import XGBClassifier

# Note: use_label_encoder was dropped; recent XGBoost versions ignore it and warn
xgb_grid = GridSearchCV(
    XGBClassifier(random_state=42, eval_metric='logloss'),
    param_grid=boosting_grid,
    cv=5,
    scoring='f1',
    n_jobs=-1,
    return_train_score=True
)

xgb_grid.fit(X_train, y_train)
Out[31]:
GridSearchCV(cv=5,
             estimator=XGBClassifier(base_score=None, booster=None,
                                     callbacks=None, colsample_bylevel=None,
                                     colsample_bynode=None,
                                     colsample_bytree=None, device=None,
                                     early_stopping_rounds=None,
                                     enable_categorical=False,
                                     eval_metric='logloss', feature_types=None,
                                     feature_weights=None, gamma=None,
                                     grow_policy=None, importance_type=None,
                                     interaction_constraint...
                                     max_delta_step=None, max_depth=None,
                                     max_leaves=None, min_child_weight=None,
                                     missing=nan, monotone_constraints=None,
                                     multi_strategy=None, n_estimators=None,
                                     n_jobs=None, num_parallel_tree=None, ...),
             n_jobs=-1,
             param_grid={'colsample_bytree': [0.5, 1],
                         'learning_rate': [0.01, 0.05, 0.1],
                         'max_depth': [3, 4, 5],
                         'n_estimators': [50, 100, 150, 200],
                         'reg_lambda': [1, 2]},
             return_train_score=True, scoring='f1')
XGBClassifier(base_score=None, booster=None, callbacks=None,
              colsample_bylevel=None, colsample_bynode=None,
              colsample_bytree=0.5, device=None, early_stopping_rounds=None,
              enable_categorical=False, eval_metric='logloss',
              feature_types=None, feature_weights=None, gamma=None,
              grow_policy=None, importance_type=None,
              interaction_constraints=None, learning_rate=0.05, max_bin=None,
              max_cat_threshold=None, max_cat_to_onehot=None,
              max_delta_step=None, max_depth=3, max_leaves=None,
              min_child_weight=None, missing=nan, monotone_constraints=None,
              multi_strategy=None, n_estimators=50, n_jobs=None,
              num_parallel_tree=None, ...)
In [32]:
results = pd.DataFrame(xgb_grid.cv_results_)

table = results[[
    'param_n_estimators',
    'param_learning_rate',
    'param_max_depth',
    'param_colsample_bytree',
    'param_reg_lambda',
    'mean_train_score',
    'mean_test_score',
    'std_test_score',
    'rank_test_score'      # rank 1 = best combo
]].sort_values('mean_test_score', ascending=False)

print(table.head(15).to_string())
    param_n_estimators  param_learning_rate  param_max_depth  param_colsample_bytree  param_reg_lambda  mean_train_score  mean_test_score  std_test_score  rank_test_score
32                  50                 0.05                4                     0.5                 1          0.989744         0.526234        0.194987                1
49                  50                 0.10                3                     0.5                 2          0.989744         0.526234        0.194987                1
57                  50                 0.10                4                     0.5                 2          0.994872         0.526234        0.194987                1
64                  50                 0.10                5                     0.5                 1          0.994872         0.526234        0.194987                1
65                  50                 0.10                5                     0.5                 2          0.994872         0.526234        0.194987                1
56                  50                 0.10                4                     0.5                 1          0.994872         0.526234        0.194987                1
43                 100                 0.05                5                     0.5                 2          0.994872         0.526234        0.194987                1
45                 150                 0.05                5                     0.5                 2          0.994872         0.526234        0.194987                1
42                 100                 0.05                5                     0.5                 1          0.994872         0.526234        0.194987                1
33                  50                 0.05                4                     0.5                 2          0.968129         0.526234        0.194987                1
35                 100                 0.05                4                     0.5                 2          0.994872         0.526234        0.194987                1
37                 150                 0.05                4                     0.5                 2          0.994872         0.526234        0.194987                1
27                 100                 0.05                3                     0.5                 2          0.989744         0.526234        0.194987                1
24                  50                 0.05                3                     0.5                 1          0.978656         0.526234        0.194987                1
25                  50                 0.05                3                     0.5                 2          0.968129         0.526234        0.194987                1

Analysis

  1. Severe Overfitting on Training Data. Across all top configurations, the mean_train_score approaches 1.0 (96% - 99%). Because Gradient Boosting sequentially hunts down and corrects errors, the algorithm aggressively memorized the 82 training instances. Despite strict regularization parameters (max_depth=3, reg_lambda=2), the model was too complex for the limited data and failed to generalize.
  2. The mean_test_score capped at 0.526, below our Random Forest baseline (0.626). Additionally, dozens of different hyperparameter configurations tied for Rank 1 with the exact same validation score. With small validation folds (~16 instances each), this suggests the overfitted models all collapsed into predicting the exact same subset of countries.
  3. The std_test_score hovers around ~0.19. This large variance indicates that the model's success depends heavily on how the cross-validation folds happened to be split.

While XGBoost is a state-of-the-art model for large tabular datasets, its aggressive sequential learning makes it highly prone to overfitting on extremely small, noisy datasets. In this context, between the two ensemble models, the independent averaging mechanism of the Random Forest proved much more robust and reliable.
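The diagnosis above can be reproduced generically: comparing mean_train_score against mean_test_score in cv_results_ makes the overfitting gap explicit. A minimal sketch on synthetic data, using a plain decision tree as a stand-in for XGBoost so it runs without the notebook's variables:

```python
import pandas as pd
from sklearn.datasets import make_classification
from sklearn.model_selection import GridSearchCV
from sklearn.tree import DecisionTreeClassifier

# Synthetic stand-in for our small tabular dataset (~80 training rows)
X, y = make_classification(n_samples=80, n_features=20, random_state=42)

grid = GridSearchCV(
    DecisionTreeClassifier(random_state=42),
    param_grid={'max_depth': [2, 4, None]},
    cv=5,
    scoring='f1',
    return_train_score=True,
)
grid.fit(X, y)

results = pd.DataFrame(grid.cv_results_)
# The train-validation gap is the overfitting signal: near zero is healthy,
# large positive values mean the model memorized the training folds.
results['overfit_gap'] = results['mean_train_score'] - results['mean_test_score']
print(results[['param_max_depth', 'mean_train_score',
               'mean_test_score', 'overfit_gap']])
```

The unrestricted tree (max_depth=None) shows the same pathology as our XGBoost runs: a perfect training score paired with a clearly lower validation score.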

Support Vector Machines¶

Unlike the ensemble models, which build branching decision rules, an SVM plots every country in a multi-dimensional space and attempts to slide a smooth, continuous mathematical boundary (a hyperplane) between the Low-Risk and High-Risk classes.

Because SVMs optimize over the geometric distances between data points, they are highly sensitive to unscaled variables. If we do not scale our features, variables with massive absolute values (like 'Population') will mathematically overpower and drown out smaller percentage metrics (like 'Unemployment rate'). To prepare the data for the SVM, we standardize our features using Scikit-Learn's StandardScaler. Crucially, we call .fit_transform() on the training data so the scaler learns its baseline statistics there, but strictly .transform() on the test data. This ensures the scaler never sees the test set's averages, preventing data leakage.

In [33]:
from sklearn.preprocessing import StandardScaler

# define the scaler
scaler = StandardScaler()

# fit the scaler to the training data
X_train_scaled = scaler.fit_transform(X_train)

# only transform the test to avoid data leakage
X_test_scaled = scaler.transform(X_test)
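As a quick sanity check of the no-leakage contract described above (a sketch with synthetic stand-in arrays, since the real X_train and X_test come from the earlier split), only the training split should come out exactly standardized:

```python
import numpy as np
from sklearn.preprocessing import StandardScaler

rng = np.random.default_rng(42)
X_tr = rng.normal(loc=50, scale=10, size=(80, 3))   # stand-in training features
X_te = rng.normal(loc=55, scale=10, size=(20, 3))   # stand-in test features

scaler = StandardScaler()
X_tr_s = scaler.fit_transform(X_tr)  # learns mean/std from training data only
X_te_s = scaler.transform(X_te)      # reuses training statistics: no leakage

# The training data comes out exactly centered and unit-scaled...
print(X_tr_s.mean(axis=0).round(6), X_tr_s.std(axis=0).round(6))
# ...but the test data generally does not, because its distribution differs
print(X_te_s.mean(axis=0).round(2))
```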

Parameter definition and tuning decisions

  • The C parameter controls the trade-off between classifying training points correctly and maintaining a generalized decision boundary. A higher C creates a strict, narrow margin that penalizes misclassifications heavily (which can lead to overfitting). A lower C encourages a wider, "softer" margin, creating a simpler decision function at the cost of some training accuracy [4]. Because our dataset is small and prone to noise, smaller values of C are recommended to maximize generalization. Therefore, our search grid will test powers of 10: [0.1, 1, 10] [5].
  • gamma defines how far the mathematical influence of a single training example reaches [4]. This directly dictates the non-linear behavior of our decision boundary, which is critical for our hypothesis that deforestation risk is defined by complex, continuous interactions. A high gamma means data points only exert influence at a very close range, leading to a highly complex, "wiggly" boundary. A low gamma means points exert influence farther away, resulting in a smoother boundary. To prevent overfitting on our small dataset, we will avoid excessively large values and test a small localized range, [0.1, 1], following literature recommendations [6].
  • The kernel function transforms the input space into a higher-dimensional feature space where the data may become linearly separable. Common kernels include linear, polynomial, RBF, and sigmoid (gamma has no effect on the linear kernel). We test linear first because, if the data is linearly separable, it is the simpler option and less prone to overfitting; we also test rbf because it is the most universally effective kernel for non-linear patterns.
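The effect of C on margin softness can be seen directly in the number of support vectors: a softer margin (small C) lets more points sit inside the margin, so more of them become support vectors. A minimal sketch on synthetic data (not the deforestation features):

```python
from sklearn.datasets import make_classification
from sklearn.svm import SVC

# Synthetic 2-class data as a stand-in for the scaled country features
X, y = make_classification(n_samples=100, n_features=5,
                           class_sep=0.8, random_state=42)

counts = {}
for C in [0.1, 1, 10]:
    clf = SVC(kernel='rbf', gamma=0.1, C=C).fit(X, y)
    # n_support_ holds the per-class support vector counts
    counts[C] = int(clf.n_support_.sum())
    print(f"C={C:>4}: {counts[C]} support vectors")
```

As C grows, the margin narrows and the support vector count typically shrinks, which is exactly the strict-versus-soft trade-off described above.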
In [34]:
svm_grid = {
    'C': [0.1, 1, 10],
    'gamma': [0.1, 1],
    'kernel': ['linear', 'rbf'],
}

With our data properly scaled, we will now construct the GridSearchCV for Support Vector Machine. We will maintain the exact same rigorous cross-validation strategy used for our ensemble models to ensure a fair, one-to-one comparison.

  • We continue to use 5-Fold Stratified Cross-Validation (cv=5) to dynamically create validation sets within the training data, ensuring we find the best hyperparameters without ever exposing the model to the locked X_test.
  • return_train_score=True. We will retain the training fold scores to analyze the mathematical behavior and actively monitor for overfitting.
  • We will set n_jobs=-1 to use all available CPU cores to drastically reduce the training time.
In [35]:
from sklearn.svm import SVC

svm_grid = GridSearchCV(
    SVC(probability=True, random_state=42),
    param_grid=svm_grid,
    cv=5,
    scoring='f1',
    n_jobs=-1,
    return_train_score=True
)

svm_grid.fit(X_train_scaled, y_train)
Out[35]:
GridSearchCV(cv=5, estimator=SVC(probability=True, random_state=42), n_jobs=-1,
             param_grid={'C': [0.1, 1, 10], 'gamma': [0.1, 1],
                         'kernel': ['linear', 'rbf']},
             return_train_score=True, scoring='f1')
SVC(C=0.1, gamma=0.1, kernel='linear', probability=True, random_state=42)
In [36]:
results = pd.DataFrame(svm_grid.cv_results_)

table = results[[
    'param_kernel',
    'param_C',
    'param_gamma',
    'mean_train_score',
    'mean_test_score',
    'std_test_score',
    'rank_test_score'
]].sort_values('mean_test_score', ascending=False)

print(table.head(15).to_string())
   param_kernel  param_C  param_gamma  mean_train_score  mean_test_score  std_test_score  rank_test_score
0        linear      0.1          0.1          0.818194         0.619814        0.174714                1
2        linear      0.1          1.0          0.818194         0.619814        0.174714                1
9           rbf     10.0          0.1          1.000000         0.619402        0.192128                3
5           rbf      1.0          0.1          0.922267         0.605556        0.187906                4
6        linear      1.0          1.0          0.870112         0.556190        0.157140                5
4        linear      1.0          0.1          0.870112         0.556190        0.157140                5
10       linear     10.0          1.0          0.935311         0.532900        0.175319                7
8        linear     10.0          0.1          0.935311         0.532900        0.175319                7
3           rbf      0.1          1.0          0.000000         0.000000        0.000000                9
1           rbf      0.1          0.1          0.000000         0.000000        0.000000                9
7           rbf      1.0          1.0          1.000000         0.000000        0.000000                9
11          rbf     10.0          1.0          1.000000         0.000000        0.000000                9

Analysis

Evaluating the SVM grid search reveals a fascinating insight about the underlying geometric structure of our deforestation dataset. Our initial hypothesis assumed a highly complex, non-linear boundary, but cross-validation proved the opposite.

  1. The top-performing configurations used a purely linear kernel with strong regularization (a soft margin of C=0.1). This setup achieved a Validation F1-Score of 0.619 while keeping the Training F1-Score at 0.818 (not badly overfitted). This comparatively small train-validation gap indicates stable generalization.
  2. When the algorithm was allowed to use the RBF kernel (e.g., C=10.0, gamma=0.1), it overfit heavily. It achieved a perfect 1.0 Training F1-Score by drawing boundaries tailored to the training points, but its validation score failed to surpass the simple linear model.
  3. A high gamma severely restricts the radius of influence of each support vector. The model memorized the training data perfectly (Training Score = 1.0) by drawing tiny, isolated islands around the High-Risk instances, rendering it completely incapable of generalizing to unseen validation data.
  4. Across our top linear models, the std_test_score sits around 0.174. This moderate variance indicates that the Validation F1-Score fluctuates noticeably depending on how the cross-validation folds were partitioned, which is expected given the dataset's size, with only ~16 instances per validation fold.

Neural Networks¶

Finally, for the Neural Network model, hyperparameter tuning via GridSearchCV is not used. Unlike tree-based models, neural networks require defining the architecture itself (the number of layers, neurons, and the training configuration) rather than searching over a fixed set of algorithmic parameters. GridSearchCV is also particularly inefficient for neural networks because each parameter combination requires a full training run across many epochs, making the computational cost prohibitive. Neural networks excel at capturing complex non-linear relationships between features, but that same flexibility makes them highly prone to overfitting on small datasets; to reduce this, regularization is applied through early stopping. Additionally, because neural networks rely on gradient-based optimization, they are highly sensitive to feature scale, so the same StandardScaler preprocessing used for the SVM model is applied.

The architecture is defined as follows, based on literature for similar dataset sizes:

  • Activation Function: ReLU (Rectified Linear Unit) is used for all hidden layers. Compared to sigmoid in hidden layers, ReLU effectively avoids the vanishing gradient problem and has become the standard default for hidden layer activations in modern neural networks.

  • Output Layer: A single neuron with sigmoid activation is used in the output layer, which maps the network's output to a probability between 0 and 1 for binary classification. The predicted class is assigned as High Risk if the output probability exceeds the threshold (0.5).

  • Optimizer and learning rate: Adam is selected as the optimizer with the default learning rate of lr=0.001. Adam is computationally efficient, has modest memory requirements, and its default hyperparameters require little to no tuning in practice [7]. There is also literature demonstrating that the combination of ReLU and Adam consistently outperforms other pairings.

  • Layers: The neuron count per layer follows three rules of thumb [9]:

    • The number of hidden neurons should be between the size of the input and output layers
    • The number of hidden neurons should be 2/3 of the input layer size plus the output layer size
    • The number of hidden neurons should be less than twice the input layer size

    Applying Rule 2 to our model (20 input features, 1 output neuron):

    1. Layer 1: (2/3 × 20) + 1 ≈ 14 → rounded up to 16 (a clean value, within the Rule 3 bound of < 40)
    2. Layer 2: (2/3 × 14) + 1 ≈ 10 → rounded down to 8 (tapering toward the output)
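Spelled out as a throwaway calculation (not part of the model code), the rule-of-thumb arithmetic is:

```python
n_inputs, n_outputs = 20, 1

# Rule 2: hidden neurons ≈ (2/3 × previous layer size) + output layer size
layer1 = (2 / 3) * n_inputs + n_outputs   # ≈ 14.3, rounded up to 16 in the model
layer2 = (2 / 3) * 14 + n_outputs         # ≈ 10.3, rounded down to 8 in the model

# Rule 3 upper bound: fewer than twice the input layer size (< 40 neurons)
print(round(layer1, 1), round(layer2, 1), 2 * n_inputs)
```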

The coding steps:

  1. Initialize Environment: Set the random seed to guarantee completely reproducible results.
  2. Construct Architecture: Instantiate the Sequential model and stack the three defined layers (16 -> 8 -> 1).
  3. Compile the Model: Configure the network to use the Adam optimizer, track accuracy, and optimize for binary_crossentropy loss.
  4. Configure Regularization: Establish EarlyStopping (patience = 10, restore_best_weights=True) to automatically halt training and revert to the optimal mathematical state before overfitting occurs.
  5. Training: Train the network using a computationally efficient batch size of 16 [9] and an automatic 80/20 internal validation split (validation_split=0.2) to monitor performance dynamically.
In [37]:
import tensorflow as tf
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Dense
from tensorflow.keras.optimizers import Adam
from tensorflow.keras.callbacks import EarlyStopping

# Set the random seed for reproducible results
tf.random.set_seed(42)

nn_model = Sequential([
    Dense(16, activation='relu', input_shape=(X_train_scaled.shape[1],)),
    Dense(8, activation='relu'),
    Dense(1,  activation='sigmoid')
])

nn_model.compile(
    optimizer=tf.keras.optimizers.Adam(learning_rate=0.001),
    loss='binary_crossentropy',
    metrics=['accuracy']
)

early_stop = EarlyStopping(
    monitor='val_loss',
    patience=10,
    restore_best_weights=True
)

history = nn_model.fit(
    X_train_scaled, y_train,
    epochs=100,
    batch_size=16,
    validation_split=0.2,
    callbacks=[early_stop],
    verbose=1
)

nn_model.summary()
Epoch 1/100
/usr/local/lib/python3.12/dist-packages/keras/src/layers/core/dense.py:106: UserWarning: Do not pass an `input_shape`/`input_dim` argument to a layer. When using Sequential models, prefer using an `Input(shape)` object as the first layer in the model instead.
  super().__init__(activity_regularizer=activity_regularizer, **kwargs)
5/5 ━━━━━━━━━━━━━━━━━━━━ 2s 107ms/step - accuracy: 0.5231 - loss: 0.6993 - val_accuracy: 0.5882 - val_loss: 0.7116
Epoch 2/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 24ms/step - accuracy: 0.5231 - loss: 0.6749 - val_accuracy: 0.5882 - val_loss: 0.6933
Epoch 3/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 22ms/step - accuracy: 0.6154 - loss: 0.6557 - val_accuracy: 0.6471 - val_loss: 0.6771
Epoch 4/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 21ms/step - accuracy: 0.6769 - loss: 0.6385 - val_accuracy: 0.6471 - val_loss: 0.6621
Epoch 5/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 20ms/step - accuracy: 0.7231 - loss: 0.6224 - val_accuracy: 0.7059 - val_loss: 0.6477
Epoch 6/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 21ms/step - accuracy: 0.7231 - loss: 0.6073 - val_accuracy: 0.8235 - val_loss: 0.6340
Epoch 7/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 21ms/step - accuracy: 0.7385 - loss: 0.5931 - val_accuracy: 0.8824 - val_loss: 0.6209
Epoch 8/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 21ms/step - accuracy: 0.7692 - loss: 0.5792 - val_accuracy: 0.8824 - val_loss: 0.6086
Epoch 9/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 20ms/step - accuracy: 0.7846 - loss: 0.5658 - val_accuracy: 0.8824 - val_loss: 0.5972
Epoch 10/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 23ms/step - accuracy: 0.7846 - loss: 0.5527 - val_accuracy: 0.8824 - val_loss: 0.5864
Epoch 11/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 20ms/step - accuracy: 0.7692 - loss: 0.5401 - val_accuracy: 0.8824 - val_loss: 0.5766
Epoch 12/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 20ms/step - accuracy: 0.7846 - loss: 0.5282 - val_accuracy: 0.8824 - val_loss: 0.5675
Epoch 13/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 20ms/step - accuracy: 0.7846 - loss: 0.5165 - val_accuracy: 0.8824 - val_loss: 0.5588
Epoch 14/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 21ms/step - accuracy: 0.7846 - loss: 0.5051 - val_accuracy: 0.8824 - val_loss: 0.5503
Epoch 15/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 21ms/step - accuracy: 0.8154 - loss: 0.4942 - val_accuracy: 0.8824 - val_loss: 0.5411
Epoch 16/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 21ms/step - accuracy: 0.8308 - loss: 0.4838 - val_accuracy: 0.8824 - val_loss: 0.5325
Epoch 17/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 20ms/step - accuracy: 0.8462 - loss: 0.4737 - val_accuracy: 0.8824 - val_loss: 0.5248
Epoch 18/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 20ms/step - accuracy: 0.8462 - loss: 0.4639 - val_accuracy: 0.8824 - val_loss: 0.5178
Epoch 19/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 30ms/step - accuracy: 0.8769 - loss: 0.4543 - val_accuracy: 0.8824 - val_loss: 0.5114
Epoch 20/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 19ms/step - accuracy: 0.8769 - loss: 0.4449 - val_accuracy: 0.8824 - val_loss: 0.5057
Epoch 21/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 19ms/step - accuracy: 0.8769 - loss: 0.4358 - val_accuracy: 0.8824 - val_loss: 0.5006
Epoch 22/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 19ms/step - accuracy: 0.8769 - loss: 0.4268 - val_accuracy: 0.8824 - val_loss: 0.4961
Epoch 23/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 21ms/step - accuracy: 0.8769 - loss: 0.4180 - val_accuracy: 0.8824 - val_loss: 0.4916
Epoch 24/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 19ms/step - accuracy: 0.8769 - loss: 0.4092 - val_accuracy: 0.8824 - val_loss: 0.4875
Epoch 25/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 21ms/step - accuracy: 0.8769 - loss: 0.4003 - val_accuracy: 0.8824 - val_loss: 0.4839
Epoch 26/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 20ms/step - accuracy: 0.8923 - loss: 0.3917 - val_accuracy: 0.8824 - val_loss: 0.4807
Epoch 27/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 20ms/step - accuracy: 0.8923 - loss: 0.3836 - val_accuracy: 0.8824 - val_loss: 0.4775
Epoch 28/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 25ms/step - accuracy: 0.8923 - loss: 0.3757 - val_accuracy: 0.8824 - val_loss: 0.4735
Epoch 29/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 20ms/step - accuracy: 0.8923 - loss: 0.3680 - val_accuracy: 0.8824 - val_loss: 0.4702
Epoch 30/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 20ms/step - accuracy: 0.8769 - loss: 0.3607 - val_accuracy: 0.8824 - val_loss: 0.4675
Epoch 31/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 20ms/step - accuracy: 0.8769 - loss: 0.3535 - val_accuracy: 0.8824 - val_loss: 0.4652
Epoch 32/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 20ms/step - accuracy: 0.8923 - loss: 0.3464 - val_accuracy: 0.8824 - val_loss: 0.4633
Epoch 33/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 20ms/step - accuracy: 0.8923 - loss: 0.3396 - val_accuracy: 0.8824 - val_loss: 0.4616
Epoch 34/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 20ms/step - accuracy: 0.8923 - loss: 0.3332 - val_accuracy: 0.8824 - val_loss: 0.4602
Epoch 35/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 21ms/step - accuracy: 0.8923 - loss: 0.3269 - val_accuracy: 0.8824 - val_loss: 0.4599
Epoch 36/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 20ms/step - accuracy: 0.8923 - loss: 0.3209 - val_accuracy: 0.8824 - val_loss: 0.4602
Epoch 37/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 30ms/step - accuracy: 0.8923 - loss: 0.3150 - val_accuracy: 0.8235 - val_loss: 0.4606
Epoch 38/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 21ms/step - accuracy: 0.8923 - loss: 0.3094 - val_accuracy: 0.8235 - val_loss: 0.4613
Epoch 39/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 21ms/step - accuracy: 0.8923 - loss: 0.3041 - val_accuracy: 0.8235 - val_loss: 0.4621
Epoch 40/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 22ms/step - accuracy: 0.8923 - loss: 0.2989 - val_accuracy: 0.8235 - val_loss: 0.4630
Epoch 41/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 19ms/step - accuracy: 0.8769 - loss: 0.2939 - val_accuracy: 0.8235 - val_loss: 0.4638
Epoch 42/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 20ms/step - accuracy: 0.8923 - loss: 0.2891 - val_accuracy: 0.8235 - val_loss: 0.4646
Epoch 43/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 21ms/step - accuracy: 0.8923 - loss: 0.2843 - val_accuracy: 0.8235 - val_loss: 0.4656
Epoch 44/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 19ms/step - accuracy: 0.8923 - loss: 0.2797 - val_accuracy: 0.8235 - val_loss: 0.4666
Epoch 45/100
5/5 ━━━━━━━━━━━━━━━━━━━━ 0s 20ms/step - accuracy: 0.8923 - loss: 0.2752 - val_accuracy: 0.8235 - val_loss: 0.4676
Model: "sequential_1"
┏━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━┓
┃ Layer (type)                    ┃ Output Shape           ┃       Param # ┃
┡━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━┩
│ dense_3 (Dense)                 │ (None, 16)             │           336 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ dense_4 (Dense)                 │ (None, 8)              │           136 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ dense_5 (Dense)                 │ (None, 1)              │             9 │
└─────────────────────────────────┴────────────────────────┴───────────────┘
 Total params: 1,445 (5.65 KB)
 Trainable params: 481 (1.88 KB)
 Non-trainable params: 0 (0.00 B)
 Optimizer params: 964 (3.77 KB)

Because we tracked accuracy during training (Keras does not report F1 here), we will use the metrics from sklearn to get the F1 score of the model, so it can be compared with our other models, especially on the final test data.

In [38]:
from sklearn.metrics import f1_score

# 1. Ask the model to predict probabilities for the training data
nn_train_probs = nn_model.predict(X_train_scaled, verbose=0)

# 2. Convert probabilities (> 0.5) into hard 1s and 0s
nn_train_preds = (nn_train_probs > 0.5).astype(int)

# 3. Calculate the F1 Score
nn_train_f1 = f1_score(y_train, nn_train_preds)
print(f"Neural Network Training F1-Score: {nn_train_f1:.4f}")
Neural Network Training F1-Score: 0.8163

An F1-Score of 0.8163 on the training data shows healthy behaviour. It suggests the network learned the underlying patterns of the data without aggressively memorizing the noise (avoiding the perfect 1.000 training scores seen with XGBoost and the RBF SVM); the EarlyStopping regularization helped here.

However, a strong training score is only half the story. The ultimate test of this model's architecture is how well it generalizes to unseen data.

Final Testing¶

This final step uses the held-out test set to evaluate all four optimized models on completely unseen data. To ensure a fair comparison, each algorithm is evaluated on its appropriate data format and scored using the exact same target metric (F1-Score).

  • The Random Forest and XGBoost receive the raw X_test, as tree-based models don't require feature scaling. Conversely, the SVM and the Neural Network are fed X_test_scaled to prevent large-magnitude features from dominating their distance and gradient calculations.
  • Because the Keras Neural Network is designed to output a continuous probability (via the sigmoid activation function), a strict > 0.5 boolean threshold is applied. This maps the mathematical probabilities back into hard binary classifications (0 or 1) so it can be evaluated fairly against the other models.
  • The final F1-scores are calculated and aggregated into a structured Pandas DataFrame. Sorting this table in descending order strips away the training biases and reveals a clear, definitive ranking of which architecture truly generalizes best to real-world deforestation data.
In [39]:
# Random Forest Predictions (Uses original X_test)
rf_preds = rf_grid.predict(X_test)
rf_f1 = f1_score(y_test, rf_preds)

# XGBoost Predictions
xgb_preds = xgb_grid.predict(X_test)
xgb_f1 = f1_score(y_test, xgb_preds)

# SVM Predictions (Uses X_test_scaled)
svm_preds = svm_grid.predict(X_test_scaled)
svm_f1 = f1_score(y_test, svm_preds)

# Neural Network Predictions (Uses X_test_scaled)
nn_probs = nn_model.predict(X_test_scaled, verbose=0)
# convert probability to binary
nn_preds = (nn_probs > 0.5).astype(int)
nn_f1 = f1_score(y_test, nn_preds)

# Build the final comparison
leaderboard = pd.DataFrame({
    'Model': ['Random Forest', 'XGBoost', 'SVM', 'Neural Network'],
    'Test F1-Score': [rf_f1, xgb_f1, svm_f1, nn_f1]
})

# Sort the leaderboard from highest score to lowest score
leaderboard = leaderboard.sort_values(by='Test F1-Score', ascending=False).reset_index(drop=True)

print(leaderboard.to_string(index=False))
         Model  Test F1-Score
  SVM (Linear)       0.727273
Neural Network       0.666667
 Random Forest       0.500000
       XGBoost       0.285714

Conclusion¶

The final evaluation on the isolated test set reveals new dynamics regarding algorithm selection for small datasets, a subject comparatively understudied in formal academic research. The Linear Support Vector Machine (SVM) achieved the highest Test F1-Score (approx. 0.73), outperforming the Artificial Neural Network (0.667). A critical reflection on complexity, overfitting, and interpretability shows that an increase in mathematical complexity does not inherently yield better results.

  1. Performance and Consistency (The Triumph of Simplicity) The Linear SVM demonstrated exceptional predictive capability and consistency. By relying on a flat, mathematical hyperplane with a wide margin, the SVM avoided memorizing localized noise and successfully generalized to unseen data. While the Neural Network performed adequately, it experienced a noticeable drop from its training score (~0.82 to 0.66), indicating that the SVM’s rigid mathematical boundary is significantly better for this specific deforestation context.

  2. Did an increase in model complexity translate to clear improvements? The answer is no. The simplest algorithm secured first place. Conversely, the highly complex, tree-boosting XGBoost model suffered a severe predictive collapse (Test F1-Score: 0.2857), and the Neural Network likewise did not deliver better real test predictions. This shows that introducing excessive algorithmic complexity on a small dataset can be outright detrimental while also consuming more compute. A simple, straight geometric boundary proved superior to the complex, non-linear boundaries attempted by XGBoost and Deep Learning when data is scarce.

  3. Risks of Overfitting The severe limitations of the dataset size (~100 total instances) inherently introduce massive overfitting risks. The poor performance of XGBoost serves as a textbook example of an algorithm memorizing the training data but failing in the real world. Furthermore, the variance observed in the Neural Network illustrates that relying on Deep Learning for such small datasets requires regularization (and a degree of luck); otherwise, it falls into the same overfitting trap that critically hindered the ensemble models.

  4. Interpretability and Practical Application The final decision on model deployment strongly favors the Linear SVM across all metrics.

    • The "Black Box": While the Neural Network is powerful, it remains a "black box" that cannot easily explain the socioeconomic reasons why a region is at risk.
    • The "Understander": If the objective of this model is to advise global governments on environmental policy, interpretability is essential. Because the Linear SVM showed the most stable and the best performance so far, there is no need to sacrifice transparency for accuracy. The SVM can explicitly reveal which specific socioeconomic factors drive deforestation via its interpretable feature weights, making it the strongest candidate for both predictive performance and practical policy-making. Random Forests offer a similar window through their feature importances.
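The interpretability claim can be sketched concretely: a linear SVM exposes one learned weight per standardized feature via coef_, and ranking those weights by magnitude shows which inputs push a country toward the High-Risk side. A minimal sketch with synthetic data and illustrative (made-up) feature names:

```python
import pandas as pd
from sklearn.datasets import make_classification
from sklearn.preprocessing import StandardScaler
from sklearn.svm import SVC

# Synthetic stand-in; the feature names are hypothetical, not the real columns
X, y = make_classification(n_samples=100, n_features=4, n_informative=3,
                           n_redundant=1, random_state=42)
feature_names = ['gdp_per_capita', 'population_growth',
                 'agricultural_land_pct', 'unemployment_rate']

X_scaled = StandardScaler().fit_transform(X)
svm = SVC(kernel='linear', C=0.1).fit(X_scaled, y)

# One weight per feature: the sign gives the direction of the push,
# the magnitude gives the influence on the decision boundary
weights = pd.Series(svm.coef_[0], index=feature_names)
print(weights.reindex(weights.abs().sort_values(ascending=False).index))
```

Note that coef_ is only available for the linear kernel; RBF models have no such per-feature weights, which is part of why the linear winner is also the interpretable one.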

Further Improvements

  1. The Neural Network could undergo a more exhaustive hyperparameter and architectural optimization process. Future iterations might explore deeper topologies or different neuron configurations, provided they continue to adhere to established architectural heuristics to prevent vanishing gradients.
  2. Subsequent analyses could expand the GridSearchCV parameter grids for the classical models. By incorporating new hyperparameter combinations, the algorithms could be fine-tuned to address the overfitting patterns and geometric-boundary findings identified in this study, especially XGBoost's regularization parameters such as alpha, lambda, and max_depth.
  3. The strict limitations of the dataset size could be mitigated by introducing a time dimension (e.g., tracking historical deforestation metrics year-over-year) to greatly increase the number of training samples. Additionally, advanced imputation techniques or synthetic data generation could be leveraged to include countries currently missing from the dataset (the full dataset could ultimately cover 200+ countries).
  4. A dedicated feature selection phase could be introduced prior to training. Isolating only the most mathematically predictive variables would reduce noise and dimensionality, which would be particularly beneficial for improving the generalization capabilities of the Random Forest and XGBoost models.
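Points 2 and 4 above can be combined in a single cross-validated search: folding a feature-selection step into the pipeline keeps the selection inside each CV fold (avoiding leakage), while the expanded grid tunes a regularizing depth parameter at the same time. The sketch below uses synthetic stand-in data and a Random Forest; the grid values shown are illustrative, not the notebook's.

```python
from sklearn.datasets import make_classification
from sklearn.feature_selection import SelectKBest, f_classif
from sklearn.model_selection import GridSearchCV
from sklearn.pipeline import Pipeline
from sklearn.ensemble import RandomForestClassifier

# Hypothetical stand-in for the country-level feature matrix.
X, y = make_classification(n_samples=100, n_features=12, n_informative=4,
                           random_state=0)

# SelectKBest runs inside each CV fold, so the filter never sees test folds.
pipe = Pipeline([("select", SelectKBest(f_classif)),
                 ("rf", RandomForestClassifier(random_state=0))])
grid = {"select__k": [4, 6, 8],
        "rf__max_depth": [2, 4, None]}  # shallower trees act as regularizers
search = GridSearchCV(pipe, grid, cv=5, scoring="f1").fit(X, y)
print(search.best_params_, round(search.best_score_, 3))
```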

References¶

[1] Teo, H. C., Sarira, T. V., Tan, A. R. P., Cheng, Y., & Koh, L. P. (2024). Charting the future of high forest low deforestation jurisdictions. Proceedings of the National Academy of Sciences of the United States of America, 121(37), e2306496121. https://doi.org/10.1073/pnas.2306496121

[2] https://link.springer.com/article/10.1186/s12911-021-01688-3

[3] https://andrewpwheeler.com/2022/10/10/hyperparameter-tuning-for-random-forests/

[4] https://scikit-learn.org/stable/auto_examples/svm/plot_rbf_parameters.html

[5] https://arxiv.org/pdf/1802.09596

[6] https://www.geeksforgeeks.org/machine-learning/gamma-parameter-in-svm/

[7] https://arxiv.org/pdf/1803.08375

[8] https://www.researchgate.net/publication/263889761_Introduction_to_Neural_Networks_for_Java

[9] https://arxiv.org/pdf/2003.12843