Test_Test_GWML_XGBoost.py


import pickle as pk
import pandas as pd
import matplotlib.pyplot as plt
import numpy as np
import os
from sklearn.preprocessing import MinMaxScaler
from sklearn.model_selection import train_test_split, GridSearchCV
from sklearn.ensemble import RandomForestClassifier, RandomForestRegressor
from scipy.spatial.distance import pdist, squareform
import xgboost as xgb
from sklearn.linear_model import LogisticRegression
from sklearn.metrics import confusion_matrix, accuracy_score, precision_score, recall_score, f1_score, roc_auc_score, classification_report
from sklearn.metrics import mean_absolute_error, mean_squared_error, r2_score, make_scorer
import math
from sklearn.model_selection import RandomizedSearchCV
from scipy.stats import randint
import random
import seaborn as sns
from sklearn.preprocessing import binarize
from sklearn.model_selection import cross_val_score, StratifiedKFold
import geopandas as gpd
from shapely.geometry import Point
from sklearn.linear_model import LinearRegression
from fiona.crs import from_epsg

################### Configuration #####################
kernel = 'adaptive' # adaptive or fixed
bw = 135 # Band Width for local models
mincatobs = 10 # minimum number of labels in each class for local models
LocalSoatialWeight = 'Bi-square'  # Bi-square or Gaussian
giveclassweight = True
givesampleweight = True
n_splits = 5 # cross validation folds
LocalCrossValidation = False # Performs Cross validation on local models with n_splits
Case = 'Classification' # Classification or Regression
importance_threshold = 0 # Removes less important features from Global Model
InBagSamples = 0.6 # from 0.5 to 0.9 for local models weighted bootstrapping
AnalyzeResiduales = False
plotFeatureImportance = False
exportLocalFeatureImportanceSHP = False
DatasetToAnalyze = 'Main' # Main , Distance, WindowsWMe, WindowsMVEM
################### Import the dataset #####################

os.chdir("D:/University/DustStorming/ToAli/DustStormModeling/For training/")

if DatasetToAnalyze == 'Main':
    dustsourcespickle = 'df_dustsources_WS0_X_0_PN20_SP___WS'
elif DatasetToAnalyze == 'Distance':
    dustsourcespickle = 'df_dustsources_WS0_X_0_PN20_SP__Dist_WS'
elif DatasetToAnalyze == 'WindowsWMe':
    dustsourcespickle = 'df_dustsources_WS7_X_7_PN20_SP_WMe___WS'
elif DatasetToAnalyze == 'WindowsMVEM':
    dustsourcespickle = 'df_dustsources_WS7_X_7_PN20_SP_Var_Med_Ent_Mod__WS'

dataset = pk.load(open(f'{dustsourcespickle}.pickle', 'rb'))
dataset = dataset.dropna()

dataset.reset_index(drop=True, inplace=True)


if DatasetToAnalyze == 'Main':
    dataset = dataset.drop(columns=['Year', 'Profile_curvature', 'Plan_curvature'])
elif DatasetToAnalyze == 'Distance':
    dataset = dataset.drop(columns=['Year', 'Profile_curvature', 'Plan_curvature',
                                    'Lakes','soil_type_Silt',
                                    'landcover_Cropland','landcover_Natural_vegetation'])
elif DatasetToAnalyze == 'WindowsWMe':
    dataset = dataset.drop(columns=['Year', 'Lakes', 'Precipitation wmean', 'Aspect', 'Curvature', 'landcover_Cropland',
                                    'soil_type_Clay_Loam', 'soil_type_Loam_Sand', 'soil_type_Sand_Clay_Loam',
                                    'soil_type_Sand_Loam', 'soil_type_Silt', 'Profile_curvature', 'Plan_curvature',
                                    'Plan_curvature wmean', 'Profile_curvature wmean'])

elif DatasetToAnalyze == 'WindowsMVEM':
    dataset = dataset.drop(columns=['Soil_evaporation median', 'Lakes', 'Lakes entropy', 'Lakes mode',
                                    'landcover mode', 'Precipitation',
                                    'Precipitation variance', 'Precipitation median', 'NDVI variance', 'Aspect',
                                    'Aspect variance', 'Aspect median', 'Curvature', 'Curvature median',
                                    'Distance_to_river variance',
                                    'Slope', 'Slope variance', 'Slope median',
                                    'Wind_Speed variance', 'landcover_Cropland', 'landcover_Natural_vegetation',
                                    'soil_type_Clay_Loam', 'soil_type_Loam_Sand',
                                    'soil_type_Sand_Clay_Loam', 'soil_type_Sand_Loam',
                                    'soil_type_Silt','Plan_curvature', 'Plan_curvature variance',
                                   'Plan_curvature median', 'Profile_curvature',
                                   'Profile_curvature variance', 'Profile_curvature median'])


# Assuming 'dust_storm' is the column you want to exclude
columns_to_scale = [col for col in dataset.columns if col not in ['dust_storm','Lakes','X','Y']]


# Initialize the MinMaxScaler
scaler = MinMaxScaler()

# Fit and transform the specified columns
dataset[columns_to_scale] = scaler.fit_transform(dataset[columns_to_scale])
Global_test_accuracy = []
Global_test_precission = []
GWML_test_accuracy = []
GWML_test_precission = []

Global_val_accuracy = []
Global_val_precission = []
GWML_val_accuracy = []
GWML_val_precission = []

numbers = [x / 100 for x in range(1, 51)]

for num in numbers:

    # Step 2: Generate random indices for 10% of the dataframe
    num_samples = int(len(dataset) * num)  # 10% of dataframe size
    random_indices = np.random.choice(dataset.index, num_samples, replace=False)

    Vdf = dataset.loc[random_indices]
    Vcoords = Vdf[['X', 'Y']]
    Vdf = Vdf.drop(columns=['X', 'Y'])

    df = dataset.drop(random_indices)
    coords = df[['X', 'Y']]
    df = df.drop(columns=['X', 'Y'])
    dframe = df.copy()

    X = df.drop(['dust_storm'], axis=1)
    y = df['dust_storm']

    # Split the training data into train and validation sets (80% train, 20% validation)
    X_train, X_test, y_train, y_test = train_test_split(X,y,test_size=0.2,random_state=0,stratify=y)

    if Case == 'Classification':
        print('############ Global model Metrics, binary classification #############')

        if AnalyzeResiduales:
            # Initialize the logistic regression model
            LinearModel = LogisticRegression()

            # Train the model on the training data
            LinearModel.fit(X_train, y_train)

            # Make predictions on the testing data
            predictions = LinearModel.predict(X_test)

            # Evaluate the model
            accuracy = accuracy_score(y_test, predictions)
            residual = y_test - predictions
            print(f'Accuracy of Linear Global model is {accuracy * 100}')
            # Find indices where residual is not equal to 0
            Nonlinearindices = np.where(residual != 0)[0]
            X_residuals = X_test.iloc[Nonlinearindices]
            y_residuals = y_test.iloc[Nonlinearindices]


        # Additional stopping parameters
        params = {
            'colsample_bytree': 0.7184927928953414,
            'gamma': 0.9916393575027221,
            'learning_rate': 0.2711585728111926,
            'max_depth': 9,
            'n_estimators': 99,
            'reg_alpha': 0.6994839362721395,
            'reg_lambda': 0.7763745385459733,
            'subsample': 0.9125483143121087
        }


        Gl_Model = xgb.XGBClassifier(objective='binary:logistic', eval_metric='logloss', **params)
        Gl_Model.fit(X_train, y_train)

        y_pred = Gl_Model.predict(X_test)

        # Perform cross-validation
        cv_scores = cross_val_score(Gl_Model, X_train, y_train, cv=n_splits,scoring='accuracy')  # Change cv value as needed

        # Print the cross-validation scores
        print("Accuracy Cross-validation scores:", cv_scores)
        print("Mean CV Score fro Accuracy:", cv_scores.mean())

        # Calculate evaluation metrics
        conf_matrix = confusion_matrix(y_test, y_pred)
        accuracy = accuracy_score(y_test, y_pred)
        precision = precision_score(y_test, y_pred)
        recall = recall_score(y_test, y_pred)
        f1 = f1_score(y_test, y_pred)
        auc = roc_auc_score(y_test, y_pred)

        # Print evaluation metrics
        # Print the metrics
        print("Accuracy: {:.2f}%".format(accuracy * 100))
        print("Precision: {:.2f}%".format(precision * 100))
        print("Recall: {:.2f}%".format(recall * 100))
        print("F1-score: {:.2f}%".format(f1 * 100))
        print('Confusion matrix:\n True negative: %s \
                  \n False positive: %s \n False negative: %s \n True positive: %s'
              % (conf_matrix[0, 0], conf_matrix[0, 1], conf_matrix[1, 0], conf_matrix[1, 1]))
        print('AUC: {:.2f}%'.format(auc * 100))

        feature_importances = Gl_Model.feature_importances_ * 100

        feature_names = X_train.columns

        # Sort features based on their importance
        sorted_indices = np.argsort(feature_importances)[::-1]
        sorted_feature_importances = feature_importances[sorted_indices]
        sorted_feature_names = [feature_names[i] for i in sorted_indices]

        if plotFeatureImportance:
            # Plotting
            plt.figure(figsize=(10, 6))
            plt.bar(range(len(feature_importances)), sorted_feature_importances, align="center")
            plt.xticks(range(len(feature_importances)), sorted_feature_names, rotation=45, ha='right')
            plt.xlabel("Feature")
            plt.ylabel("Feature Importance (%)")
            plt.title("Feature Importance Plot")
            plt.tight_layout()
            plt.show()


        # Identify columns with low importance
        low_importance_columns = X_train.columns[feature_importances < importance_threshold]

    elif Case =='Regression':
        print('############ Global model Metrics, Regression #############')

        if AnalyzeResiduales:
            # Initialize the logistic regression model
            LinearModel = LogisticRegression()

            # Train the model on the training data
            LinearModel.fit(X_train, y_train)

            # Make predictions on the testing data
            predictions = LinearModel.predict(X_test)

            # Evaluate the model
            accuracy = accuracy_score(y_test, predictions)
            residual = y_test - predictions

            # Find indices where residual is not equal to 0
            Nonlinearindices = np.where(residual != 0)[0]
            X_residuals = X_test.iloc[Nonlinearindices]
            y_residuals = y_test.iloc[Nonlinearindices]

        # Additional stopping parameters for regression
        params = {
            'colsample_bytree': 0.9247455836661762,
            'gamma': 0.29820290176358466,
            'learning_rate': 0.027168933983876396,
            'max_depth': 6,
            'n_estimators': 237,
            'reg_alpha': 0.8804846994706799,
            'reg_lambda': 0.028063747200209987,
            'subsample': 0.5701708183796725
        }

        Gl_Model = xgb.XGBRegressor(objective='reg:squarederror', **params)
        Gl_Model.fit(X_train, y_train)

        y_pred = Gl_Model.predict(X_test)

        # Perform cross-validation
        cv_scores = cross_val_score(Gl_Model, X_train, y_train, cv=n_splits,scoring=make_scorer(mean_squared_error))  # Change cv value as needed

        # Print the cross-validation scores
        print("Mean Squared Error Cross-validation scores:", cv_scores)
        print("Mean CV Score for Mean Squared Error:", cv_scores.mean())

        # Calculate evaluation metrics
        mse = mean_squared_error(y_test, y_pred)
        mae = mean_absolute_error(y_test, y_pred)
        r2 = r2_score(y_test, y_pred)

        # Print evaluation metrics
        print("Mean Squared Error (MSE): {:.2f}".format(mse))
        print("Mean Absolute Error (MAE): {:.2f}".format(mae))
        print("R-squared (R2): {:.2f}".format(r2))

        threshold = 0.5
        y_pred_binary = (y_pred > threshold).astype(int)

        # Calculate evaluation metrics
        accuracy = accuracy_score(y_test, y_pred_binary)
        precision = precision_score(y_test, y_pred_binary)
        recall = recall_score(y_test, y_pred_binary)
        f1 = f1_score(y_test, y_pred_binary)
        auc = roc_auc_score(y_test, y_pred)
        conf_matrix = confusion_matrix(y_test, y_pred_binary)

        # Print confusion matrix
        print('Confusion matrix:\n', conf_matrix)

        # Print evaluation metrics
        print("Accuracy: {:.2f}%".format(accuracy * 100))
        print("Precision: {:.2f}%".format(precision * 100))
        print("Recall: {:.2f}%".format(recall * 100))
        print("F1-score: {:.2f}%".format(f1 * 100))
        print('AUC: {:.2f}%'.format(auc * 100))

        feature_importances = Gl_Model.feature_importances_ * 100

        feature_names = X_train.columns

        # Sort features based on their importance
        sorted_indices = np.argsort(feature_importances)[::-1]
        sorted_feature_importances = feature_importances[sorted_indices]
        sorted_feature_names = [feature_names[i] for i in sorted_indices]

        if plotFeatureImportance:
            # Plotting
            plt.figure(figsize=(10, 6))
            plt.bar(range(len(feature_importances)), sorted_feature_importances, align="center")
            plt.xticks(range(len(feature_importances)), sorted_feature_names, rotation=45, ha='right')
            plt.xlabel("Feature")
            plt.ylabel("Feature Importance (%)")
            plt.title("Feature Importance Plot")
            plt.tight_layout()
            plt.show()

        # Identify columns with low importance
        low_importance_columns = X_train.columns[feature_importances < importance_threshold]

    df_local = dframe.drop(low_importance_columns, axis=1)
    df_local['pointID'] = df_local.index

    # Calculate pairwise distances
    distance_array = pdist(coords)

    # Convert the pairwise distances to a square matrix
    Dij = squareform(distance_array)

    if kernel == 'adaptive':
        Ne = bw
        print(f"Kernel: Adaptive\nNeighbours: {Ne}")
    elif kernel == 'fixed':
        print(f"Kernel: Fixed\nBandwidth: {bw}")

    def bootstrapWeighted(X_train,y_train,case_weights,mincatobs,InBagSamples,n_splits):
        # Calculate the number of samples to select
        num_samples = len(X_train)

        # Calculate the number of samples to be included in the bootstrap sample (70%)
        num_bootstrap_samples = int(InBagSamples * num_samples)

        # Select InBagSmples of indices with replacement based on case weights
        bootstrap_indices = np.random.choice(X_train.index, num_bootstrap_samples, replace=True,
                                             p=case_weights / np.sum(case_weights))

        oob_indices = np.setdiff1d(X_train.index, bootstrap_indices)

        # In bag X and y
        X_train_weighted = X_train.loc[bootstrap_indices]
        y_train_weighted = y_train.loc[bootstrap_indices]

        while 0 not in X_train_weighted['DNeighbour'].values:
            # Select the first InBagSamples of indices without replacement based on case weights
            bootstrap_indices = np.random.choice(X_train.index, num_bootstrap_samples, replace=True,
                                                 p=case_weights / np.sum(case_weights))
            # The remaining of indices are for OOB
            oob_indices = np.setdiff1d(X_train.index, bootstrap_indices)

            # In bag X and y
            X_train_weighted = X_train.loc[bootstrap_indices]
            y_train_weighted = y_train.loc[bootstrap_indices]

        value_counts = y_train_weighted.value_counts()
        min_category = y_train.value_counts().idxmin()
        if len(value_counts) < 2 or y_train_weighted.value_counts().get(min_category, 0) < n_splits+1:

            # Ensure that the indices to remove contain rows with max_category
            min_category_indices = np.random.choice(y_train[y_train == min_category].index,n_splits+1,replace=False)

            # Append min_category_indices to X_train_weighted and y_train_weighted
            X_train_weighted = pd.concat([X_train_weighted, X_train.loc[min_category_indices]])
            y_train_weighted = pd.concat([y_train_weighted, y_train.loc[min_category_indices]])

            # Remove min_category_indices from oob_indices
            oob_indices = np.setdiff1d(oob_indices, min_category_indices)

            # Add min_category_indices to bootstrap_indices
            bootstrap_indices = np.concatenate((bootstrap_indices, min_category_indices))

        # Save out-of-bag samples
        X_OOB = X_train.loc[oob_indices]
        y_OOB = y_train.loc[oob_indices]

        # Onlu in Bag Spatial Weighted
        spatial_weights = case_weights.loc[bootstrap_indices]

        # Weighted Bootstrapping outputs
        return X_train_weighted, y_train_weighted, X_OOB, y_OOB, spatial_weights

    obs = len(df_local)

    # Add 'pointID' column to 'dframe'

    coords['pointID'] = df_local['pointID']

    prediction_df = pd.DataFrame(columns=['PointID', 'y_test_l', 'y_pred_l', 'TruePositive',
                                          'TrueNegative', 'FalsePositive', 'FalseNegative'])

    Validation_OOB_df = pd.DataFrame(columns=['PointID', 'y_OOB', 'y_validation_OOB', 'TruePositive',
                                          'TrueNegative', 'FalsePositive', 'FalseNegative'])


    layered_df_dict = {}
    local_models = {}
    Feature_Importance_l = {}
    local_model_accuracy_l = {}
    Local_models_cv = []


    for m in range(0,obs):
        # Get the data
        DNeighbour = Dij[:, m]

        #### Create a new DataFrame 'DataSet' with 'df_local' and 'DNeighbour'
        DataSet = df_local.copy()
        DataSet['DNeighbour'] = DNeighbour
        # Sort by distance
        DataSetSorted = DataSet.sort_values(by='DNeighbour')
        if kernel == 'adaptive':
            cc = 1
            # Keep Nearest Neighbours
            SubSet = DataSetSorted.iloc[:Ne, :]
        elif kernel == 'fixed':
            SubSet = DataSetSorted[DataSetSorted['DNeighbour'] <= bw]
            Kernel_H = bw

        # Make sure there is at least one type of both labels in the subset
        while len(SubSet['dust_storm'].unique()) < 2 or SubSet['dust_storm'].value_counts()[0] < mincatobs or SubSet['dust_storm'].value_counts()[1] < mincatobs:
            SubSet = DataSetSorted.iloc[:Ne + cc, :]
            cc += 1
        if cc > 1:
            # before_removal_coords = pd.merge(SubSet, coords, on='pointID', how='left')

            # Plot KDE plot
            # plt.figure(figsize=(10, 6))
            # sns.kdeplot(data=SubSet, x='DNeighbour', fill=True)
            # plt.title('Probability Distribution of DNeighbour')
            # plt.xlabel('DNeighbour')
            # plt.ylabel('Probability Density')
            # plt.show()

            value_counts = SubSet['dust_storm'].value_counts()
            max_category = value_counts.idxmax()

            # Calculate the probabilities based on 'DNeighbour'
            probabilities = SubSet['DNeighbour'] / SubSet['DNeighbour'].sum()

            # Ensure that the indices to remove contain rows with max_category
            max_category_indices = SubSet[SubSet['dust_storm'] == max_category].index
            # Generate random indices with higher probability for higher 'DNeighbour' values
            remove_indices = np.random.choice(max_category_indices,
                                              size=len(max_category_indices) - (bw - mincatobs),
                                              replace=False,
                                              p=probabilities.loc[max_category_indices] /
                                                probabilities.loc[max_category_indices].sum())


            # Remove the selected rows
            SubSet = SubSet.drop(remove_indices)

            # Plot KDE plot
            # plt.figure(figsize=(10, 6))
            # sns.kdeplot(data=SubSet, x='DNeighbour', fill=True)
            # plt.title('Probability Distribution of DNeighbour')
            # plt.xlabel('DNeighbour')
            # plt.ylabel('Probability Density')
            # plt.show()

        if kernel == 'adaptive':
            Kernel_H = SubSet['DNeighbour'].max()
        elif kernel == 'fixed':
            Kernel_H = bw

        after_removal_coords = pd.merge(SubSet, coords, on='pointID', how='left')
        layered_df_dict[SubSet.loc[SubSet['DNeighbour'] == 0, 'pointID'].values[0]] = after_removal_coords

        # # Plotting latitude and longitude coordinates
        # plt.figure(figsize=(10, 8))
        # plt.scatter(after_removal_coords['X'], after_removal_coords['Y'], c=after_removal_coords['dust_storm'],
        #             cmap='coolwarm', s=50, alpha=0.7, label='dust_storm')
        # plt.scatter(after_removal_coords['X'].iloc[0], after_removal_coords['Y'].iloc[0], color='red', marker='*', s=200,
        #             label='First Point')
        # plt.title('Scatter Plot of Latitude and Longitude Coordinates')
        # plt.xlabel('Longitude')
        # plt.ylabel('Latitude')
        # plt.grid(True)
        # plt.legend()
        # plt.show()

        #### Split training and test data for the local models
        X_l = SubSet.drop(['dust_storm'], axis=1)
        y_l = SubSet['dust_storm']
        X_train_l, X_test_l, y_train_l, y_test_l = train_test_split(X_l, y_l, test_size=0.2, random_state=0, stratify=y_l)

        # Make sure there is at least one type of both labels in the Training data
        # value_counts = y_train_l.value_counts()
        while len(y_train_l.unique()) < 2 or 0 not in X_train_l['DNeighbour'].values or y_train_l.value_counts().values[y_train_l.value_counts().idxmin()] < math.floor(0.8*mincatobs) :
            random_integer = random.randint(0, 123)
            X_train_l, X_test_l, y_train_l, y_test_l = train_test_split(X_l, y_l, test_size=0.2,
                                                                        random_state=random_integer, stratify=y_l)

        # Bi-square weights
        if LocalSoatialWeight == 'Bi-square':
            Wts_train = (1 - (X_train_l['DNeighbour'] / Kernel_H) ** 2) ** 2
        elif LocalSoatialWeight == 'Guassian':
            Wts_train = np.exp(-(X_train_l['DNeighbour']**2) / (2 * Kernel_H**2))

        #### Use bootstrapWeighted to get weighted samples
        (X_train_l_weighted, y_train_l_weighted,
         X_OOB, y_OOB, case_weights) = bootstrapWeighted(X_train_l,
                                                         y_train_l,
                                                         Wts_train,
                                                         mincatobs,
                                                         InBagSamples,
                                                         n_splits)

        # Drop pointID
        # X_train_l_main_noPID = X_train_l.drop(['pointID'], axis=1)
        X_train_l_noPID = X_train_l_weighted.drop(['pointID','DNeighbour'], axis=1)
        X_test_l_noPID = X_test_l.drop(['pointID','DNeighbour'], axis=1)
        X_OOB_noPID = X_OOB.drop(['pointID','DNeighbour'], axis=1)
        X_train_l_main_noPID = X_train_l.drop(['pointID','DNeighbour'], axis=1)


        if Case == 'Classification':
            #### Class Weights
            # Calculate class weights
            # num_class_0_train = sum(y_train_l_weighted == 0)
            # num_class_1_train = sum(y_train_l_weighted == 1)
            # num_class_total = num_class_0_train + num_class_1_train
            #
            # weight_class_0_train = (num_class_total / (2 * num_class_0_train)) * 100
            # weight_class_1_train = (num_class_total / (2 * num_class_1_train)) * 100
            #
            # weight_class_0_normalized = weight_class_0_train / (weight_class_0_train + weight_class_1_train)
            # weight_class_1_normalized = weight_class_1_train / (weight_class_0_train + weight_class_1_train)
            #
            # # Create a dictionary of class weights
            # # class_weights = {0: weight_class_0_normalized, 1: weight_class_1_normalized}
            # class_weights = {0: weight_class_0_train, 1: weight_class_1_train}
            # if giveclassweight:
            #     params['class_weight'] = class_weights
            # else:
            #     params['class_weight'] = None
            # params['bootstrap'] = False
            # params['max_samples'] = None

            case_weights_float = case_weights.astype(float)
            #### Randomforest classifier
            LO_Model = xgb.XGBClassifier(objective='binary:logistic', eval_metric='logloss', **params)
            # FIT THE MODEL TO THE TRAINING DATA
            # , sample_weight = case_weights_float
            if givesampleweight:
                LO_Model.fit(X_train_l_noPID, y_train_l_weighted, sample_weight = case_weights_float)
            else:
                LO_Model.fit(X_train_l_noPID, y_train_l_weighted)
            # LO_Model.fit(X_train_l_main_noPID, y_train_l,sample_weight = Wts_train)

            #### TEST PREDICTION
            y_pred_l = LO_Model.predict(X_test_l_noPID)
            local_model_accuracy = accuracy_score(y_test_l, y_pred_l)
            local_models[SubSet.loc[SubSet['DNeighbour'] == 0, 'pointID'].values[0]] = LO_Model
            if LocalCrossValidation:
                #Perform cross-validation
                cv_scores = cross_val_score(LO_Model, X_train_l_noPID, y_train_l_weighted, cv=n_splits, scoring='accuracy')
                prediction_cv = cv_scores.mean()
                Local_models_cv.append(prediction_cv)
            else:
                prediction_cv = 0
                Local_models_cv.append(prediction_cv)
        elif Case == 'Regression':
            # params['bootstrap'] = False
            # params['max_samples'] = None
            LO_Model = xgb.XGBRegressor(objective='reg:squarederror', **params)
            # FIT THE MODEL TO THE TRAINING DATA
            # , sample_weight = case_weights_float
            LO_Model.fit(X_train_l_noPID, y_train_l_weighted)
            # LO_Model.fit(X_train_l_main_noPID, y_train_l,sample_weight = Wts_train)

            #### TEST PREDICTION
            y_pred_regression = LO_Model.predict(X_test_l_noPID)
            y_pred_l = (y_pred_regression > threshold).astype(int)
            local_model_accuracy = accuracy_score(y_test_l, y_pred_l)

            local_models[SubSet.loc[SubSet['DNeighbour'] == 0, 'pointID'].values[0]] = LO_Model

            if LocalCrossValidation:
                # Perform cross-validation
                cv_scores = cross_val_score(LO_Model, X_train_l_noPID, y_train_l_weighted, cv=n_splits, scoring=make_scorer(mean_squared_error))
                prediction_cv =  cv_scores.mean()
                Local_models_cv.append(prediction_cv)
            else:
                prediction_cv = 0
                Local_models_cv.append(prediction_cv)

        feature_importances_local = LO_Model.feature_importances_ * 100
        Feature_Importance_l[SubSet.loc[SubSet['DNeighbour'] == 0, 'pointID'].values[0]] = feature_importances_local
        local_model_accuracy_l[SubSet.loc[SubSet['DNeighbour'] == 0, 'pointID'].values[0]] = local_model_accuracy

        prediction_row = pd.DataFrame({'PointID': X_test_l['pointID'],
                                       'y_test_l': y_test_l,
                                       'y_pred_l': y_pred_l,
                                       'TruePositive': 0,
                                       'TrueNegative': 0,
                                       'FalsePositive': 0,
                                       'FalseNegative': 0}, )

        prediction_df = pd.concat([prediction_df, prediction_row], ignore_index=True)

        #### OUT OF BAG VALDIATION
        if Case == 'Classification':
            y_validation_OOB = LO_Model.predict(X_OOB_noPID)
        elif Case == 'Regression':
            y_validation_OOB_regression = LO_Model.predict(X_OOB_noPID)
            y_validation_OOB = (y_validation_OOB_regression > threshold).astype(int)


        validation_OOB_row = pd.DataFrame({'PointID': X_OOB['pointID'],
                                           'y_OOB': y_OOB,
                                           'y_validation_OOB': y_validation_OOB,
                                           'TruePositive': 0,
                                           'TrueNegative': 0,
                                           'FalsePositive': 0,
                                           'FalseNegative': 0}, )
        Validation_OOB_df = pd.concat([Validation_OOB_df, validation_OOB_row], ignore_index=True)
        # if m == [200, 500, 800, 1000, 1200, 1500, 1700]:
        print(m)

    print('############ Local model Metrics PREDICTION #############')

    # Calculate True Positive, True Negative, False Positive, False Negative for each row
    for index, row in prediction_df.iterrows():
        if row['y_test_l'] == 1 and row['y_pred_l'] == 1:
            prediction_df.at[index, 'TruePositive'] = 1
        elif row['y_test_l'] == 0 and row['y_pred_l'] == 0:
            prediction_df.at[index, 'TrueNegative'] = 1
        elif row['y_test_l'] == 0 and row['y_pred_l'] == 1:
            prediction_df.at[index, 'FalsePositive'] = 1
        elif row['y_test_l'] == 1 and row['y_pred_l'] == 0:
            prediction_df.at[index, 'FalseNegative'] = 1


    # Group by PointID and sum the values for each group
    aggregated_df = prediction_df.groupby('PointID').agg({
        'TruePositive': 'sum',
        'TrueNegative': 'sum',
        'FalsePositive': 'sum',
        'FalseNegative': 'sum'
    }).reset_index()

    aggregated_df['MajorityClass'] = aggregated_df[['TruePositive', 'TrueNegative', 'FalsePositive', 'FalseNegative']].idxmax(axis=1)


    # Calculate counts for TruePositive, TrueNegative, FalsePositive, and FalseNegative
    tp_count = aggregated_df['MajorityClass'].value_counts().get('TruePositive', 0)
    tn_count = aggregated_df['MajorityClass'].value_counts().get('TrueNegative', 0)
    fp_count = aggregated_df['MajorityClass'].value_counts().get('FalsePositive', 0)
    fn_count = aggregated_df['MajorityClass'].value_counts().get('FalseNegative', 0)

    # Create a confusion matrix DataFrame
    confusion_matrix_local = pd.DataFrame({
        'Predicted_Positive': [tp_count, fp_count],
        'Predicted_Negative': [fn_count, tn_count]
    }, index=['Actual_Positive', 'Actual_Negative'])

    # Print or display the confusion matrix
    print('Confusion Matrix for Prediction')
    print(confusion_matrix_local)

    TP_L = tp_count
    TN_L = tn_count
    FP_L = fp_count
    FN_L = fn_count

    # Calculate performance metrics
    accuracy_local = (TP_L + TN_L) / (TP_L + TN_L + FP_L + FN_L)
    precision_local = TP_L / (TP_L + FP_L)
    recall_local = TP_L / (TP_L + FN_L)
    f1_local = 2 * precision_local * recall_local / (precision_local + recall_local)

    local_CV_score = np.mean(Local_models_cv)

    # Print or display the calculated metrics
    print("Accuracy: {:.2f}".format(accuracy_local*100))
    print("Precision: {:.2f}".format(precision_local*100))
    print("Recall: {:.2f}".format(recall_local*100))
    print("F1 Score: {:.2f}".format(f1_local*100))
    print(f"{n_splits} fold cross validation score = {local_CV_score}")


    print('############ Local model Metrics OOB VALIDATION #############')

    # Calculate True Positive, True Negative, False Positive, False Negative for each row
    for index, row in Validation_OOB_df.iterrows():
        if row['y_OOB'] == 1 and row['y_validation_OOB'] == 1:
            Validation_OOB_df.at[index, 'TruePositive'] = 1
        elif row['y_OOB'] == 0 and row['y_validation_OOB'] == 0:
            Validation_OOB_df.at[index, 'TrueNegative'] = 1
        elif row['y_OOB'] == 0 and row['y_validation_OOB'] == 1:
            Validation_OOB_df.at[index, 'FalsePositive'] = 1
        elif row['y_OOB'] == 1 and row['y_validation_OOB'] == 0:
            Validation_OOB_df.at[index, 'FalseNegative'] = 1

    # Group by PointID and sum the values for each group
    aggregated_oob_df = Validation_OOB_df.groupby('PointID').agg({
        'TruePositive': 'sum',
        'TrueNegative': 'sum',
        'FalsePositive': 'sum',
        'FalseNegative': 'sum'
    }).reset_index()

    aggregated_oob_df['MajorityClass'] = aggregated_oob_df[['TruePositive', 'TrueNegative', 'FalsePositive', 'FalseNegative']].idxmax(axis=1)

    # Calculate counts for TruePositive, TrueNegative, FalsePositive, and FalseNegative
    tp_count_OOB = aggregated_oob_df['MajorityClass'].value_counts().get('TruePositive', 0)
    tn_count_OOB = aggregated_oob_df['MajorityClass'].value_counts().get('TrueNegative', 0)
    fp_count_OOB = aggregated_oob_df['MajorityClass'].value_counts().get('FalsePositive', 0)
    fn_count_OOB = aggregated_oob_df['MajorityClass'].value_counts().get('FalseNegative', 0)


    # Create a confusion matrix DataFrame
    confusion_matrix_local_OOB = pd.DataFrame({
        'Predicted_Positive': [tp_count_OOB, fp_count_OOB],
        'Predicted_Negative': [fn_count_OOB, tn_count_OOB]
    }, index=['Actual_Positive', 'Actual_Negative'])


    # Print or display the confusion matrix
    print('Confusion Matrix for OOB')
    print(confusion_matrix_local_OOB)

    TP_L_OOB = tp_count_OOB
    TN_L_OOB = tn_count_OOB
    FP_L_OOB = fp_count_OOB
    FN_L_OOB = fn_count_OOB

    # Calculate performance metrics
    accuracy_local_OOB = (TP_L_OOB + TN_L_OOB) / (TP_L_OOB + TN_L_OOB + FP_L_OOB + FN_L_OOB)
    precision_local_OOB = TP_L_OOB / (TP_L_OOB + FP_L_OOB)
    recall_local_OOB = TP_L_OOB / (TP_L_OOB + FN_L_OOB)
    f1_local_OOB = 2 * precision_local_OOB * recall_local_OOB / (precision_local_OOB + recall_local_OOB)


    # Print or display the calculated metrics
    print("OOB Accuracy: {:.2f}%".format(accuracy_local_OOB*100))
    print("OOB Precision: {:.2f}".format(precision_local_OOB*100))
    print("OOB Recall: {:.2f}".format(recall_local_OOB*100))
    print("OOB F1 Score: {:.2f}".format(f1_local_OOB*100))

    if exportLocalFeatureImportanceSHP:
        temp_df = df_local.drop(['pointID', 'dust_storm'], axis=1)
        ExportDF = pd.DataFrame()
        Localfeature_df = pd.DataFrame.from_dict(Feature_Importance_l , orient='index', columns=temp_df.columns)
        Localaccuracy_df = pd.DataFrame.from_dict(local_model_accuracy_l , orient='index', columns=['Accuracy'])
        ExportDF = pd.concat([coords, Localfeature_df,Localaccuracy_df], axis=1)

        # Convert latitude and longitude to a Point geometry
        geometry = [Point(xy) for xy in zip(ExportDF['X'], ExportDF['Y'])]

        # Create a GeoDataFrame
        gdf = gpd.GeoDataFrame(ExportDF, geometry=geometry)

        # Set the coordinate reference system (CRS) if needed
        # For example, setting it to WGS 84 (EPSG:4326)
        gdf.crs = from_epsg(4326)

        # Save the GeoDataFrame as a shapefile
        output_shapefile = f'GWML_XGBoost_{Case}.shp'
        gdf.to_file(output_shapefile, driver='ESRI Shapefile')

        # Optionally, you can also create a .prj file to specify the CRS
        with open(output_shapefile.replace('.shp', '.prj'), 'w') as f:
            f.write(gdf.crs.to_wkt())


    print('################ Models evaluation #############')
    X_evaluate = Vdf.drop(['dust_storm'], axis=1)
    y_evaluate = Vdf['dust_storm']
    if Case == 'Classification':
        Global_model_y_predict = Gl_Model.predict(X_evaluate)
        if AnalyzeResiduales:
            Linear_model_y_predict = LinearModel.predict(X_evaluate)
    elif Case == 'Regression':
        Global_model_y_predict_ = Gl_Model.predict(X_evaluate)
        Global_model_y_predict = (Global_model_y_predict_ > threshold).astype(int)
        if AnalyzeResiduales:
            Linear_model_y_predict_ = LinearModel.predict(X_evaluate)
            Linear_model_y_predict = (Linear_model_y_predict_ > threshold).astype(int)
    Global_model_y_predict = pd.Series(Global_model_y_predict, index=X_evaluate.index).reindex(X_evaluate.index)
    if AnalyzeResiduales:
        Linear_model_y_predict = pd.Series(Linear_model_y_predict, index=X_evaluate.index).reindex(X_evaluate.index)


    # Calculate evaluation metrics
    conf_matrix_test = confusion_matrix(y_evaluate, Global_model_y_predict)
    accuracy_test = accuracy_score(y_evaluate, Global_model_y_predict)
    precision_test = precision_score(y_evaluate, Global_model_y_predict)
    recall_test = recall_score(y_evaluate, Global_model_y_predict)
    f1_test = f1_score(y_evaluate, Global_model_y_predict)
    auc_test = roc_auc_score(y_evaluate, Global_model_y_predict)

    # Print evaluation metrics
    print('Evaluate Global model #####')
    print("Accuracy: {:.2f}%".format(accuracy_test * 100))
    print("Precision: {:.2f}%".format(precision_test * 100))
    print("Recall: {:.2f}%".format(recall_test * 100))
    print("F1-score: {:.2f}%".format(f1_test * 100))
    print('Confusion matrix:\n True negative: %s \
              \n False positive: %s \n False negative: %s \n True positive: %s'
          % (conf_matrix_test[0, 0], conf_matrix_test[0, 1], conf_matrix_test[1, 0], conf_matrix_test[1, 1]))
    print('AUC: {:.2f}%'.format(auc_test * 100))

    print('Evaluate local model #####')

    # temp_df = df_local.drop(['pointID', 'dust_storm'], axis=1)
    # ExportDF = pd.DataFrame()
    # Localfeature_df = pd.DataFrame.from_dict(Feature_Importance_l , orient='index', columns=temp_df.columns)
    # Localaccuracy_df = pd.DataFrame.from_dict(local_model_accuracy_l , orient='index', columns=['Accuracy'])
    # ExportDF = pd.concat([coords, Localfeature_df,Localaccuracy_df], axis=1)

    X_evaluate_local = X_evaluate.drop(low_importance_columns, axis=1)

    prediction_df_final = pd.DataFrame(columns=['PointID', 'y_test_l', 'y_pred_l', 'TruePositive_l',
                                          'TrueNegative_l', 'FalsePositive_l', 'FalseNegative_l','NonLinear'])
    if AnalyzeResiduales:
        common_numbers = [num for num in layered_df_dict.keys() if num in Nonlinearindices]
    for Index in X_evaluate_local.index:

        X_prediction = X_evaluate_local.loc[[Index]]
        y_actual = y_evaluate.loc[Index]
        D = np.sqrt((Vcoords.loc[Index]['X'] - coords['X']) ** 2 + (Vcoords.loc[Index]['Y'] - coords['Y']) ** 2)
        for key, item in layered_df_dict.items():
            if D.loc[key] < np.max(layered_df_dict[key]['DNeighbour']):

                if Case == 'Classification':
                    y_prediction_local = local_models[key].predict(X_prediction)
                elif Case == 'Regression':
                    y_prediction_local_ = local_models[key].predict(X_prediction)
                    y_prediction_local = (y_prediction_local_ > threshold).astype(int)

                prediction_row_final = pd.DataFrame({'PointID': [X_prediction.index[0]],
                                                     'y_test_l': [y_actual],
                                                     'y_pred_l': [y_prediction_local[0]],
                                                     'TruePositive_l': 0,
                                                     'TrueNegative_l': 0,
                                                     'FalsePositive_l': 0,
                                                     'FalseNegative_l': 0,
                                                     'NonLinear': 0}, )
                if AnalyzeResiduales:
                    if key in common_numbers:
                        prediction_row_final['NonLinear'] = 1
                prediction_df_final = pd.concat([prediction_df_final, prediction_row_final], ignore_index=True)


            else:
                pass


    # Calculate True Positive, True Negative, False Positive, False Negative for each row
    for index, row in prediction_df_final.iterrows():
        if row['y_test_l'] == 1 and row['y_pred_l'] == 1:
            prediction_df_final.at[index, 'TruePositive_l'] = 1
        elif row['y_test_l'] == 0 and row['y_pred_l'] == 0:
            prediction_df_final.at[index, 'TrueNegative_l'] = 1
        elif row['y_test_l'] == 0 and row['y_pred_l'] == 1:
            prediction_df_final.at[index, 'FalsePositive_l'] = 1
        elif row['y_test_l'] == 1 and row['y_pred_l'] == 0:
            prediction_df_final.at[index, 'FalseNegative_l'] = 1


    # Group by PointID and sum the values for each group
    aggregated_df_final = prediction_df_final.groupby('PointID').agg({
        'TruePositive_l': 'sum',
        'TrueNegative_l': 'sum',
        'FalsePositive_l': 'sum',
        'FalseNegative_l': 'sum',
        'NonLinear': 'sum'
    }).reset_index()

    aggregated_df_final['MajorityClass'] = aggregated_df_final[['TruePositive_l', 'TrueNegative_l', 'FalsePositive_l', 'FalseNegative_l']].idxmax(axis=1)

    # Calculate counts for TruePositive, TrueNegative, FalsePositive, and FalseNegative
    tp_count_local_final = aggregated_df_final['MajorityClass'].value_counts().get('TruePositive_l', 0)
    tn_count_local_final = aggregated_df_final['MajorityClass'].value_counts().get('TrueNegative_l', 0)
    fp_count_local_final = aggregated_df_final['MajorityClass'].value_counts().get('FalsePositive_l', 0)
    fn_count_local_final = aggregated_df_final['MajorityClass'].value_counts().get('FalseNegative_l', 0)

    # Create a confusion matrix DataFrame
    confusion_matrix_local_final = pd.DataFrame({
        'Predicted_Positive': [tp_count_local_final, fp_count_local_final],
        'Predicted_Negative': [fn_count_local_final, tn_count_local_final]
    }, index=['Actual_Positive', 'Actual_Negative'])

    # Print or display the confusion matrix
    print('Confusion Matrix for Prediction')
    print(confusion_matrix_local_final)

    TP_local_final = tp_count_local_final
    TN_local_final = tn_count_local_final
    FP_local_final = fp_count_local_final
    FN_local_final = fn_count_local_final

    # Calculate performance metrics
    accuracy_local_final = (TP_local_final + TN_local_final) / (TP_local_final + TN_local_final + FP_local_final + FN_local_final)
    precision_local_final = TP_local_final / (TP_local_final + FP_local_final)
    recall_local_final = TP_local_final / (TP_local_final + FN_local_final)
    f1_local_final = 2 * precision_local_final * recall_local_final / (precision_local_final + recall_local_final)

    # Print or display the calculated metrics
    print("Accuracy: {:.2f}".format(accuracy_local_final*100))
    print("Precision: {:.2f}".format(precision_local_final*100))
    print("Recall: {:.2f}".format(recall_local_final*100))
    print("F1 Score: {:.2f}".format(f1_local_final*100))


    aggregated_df_final ['PID']= aggregated_df_final ['PointID']
    aggregated_df_final.set_index('PID', inplace=True)

    sorted_index = X_evaluate.index.intersection(aggregated_df_final.index).tolist()
    sorted_aggregated_df_final = aggregated_df_final.reindex(sorted_index)

    def map_predictions(row):
        if row['MajorityClass'] == 'TruePositive_l' or row['MajorityClass'] == 'FalsePositive_l':
            return 1
        else:
            return 0

    # Apply the function to create a new column with binary predictions
    sorted_aggregated_df_final['Binary_Predictions'] = sorted_aggregated_df_final.apply(map_predictions, axis=1)

    LastDataframe = pd.concat([Vdf['dust_storm'],Global_model_y_predict.rename('Global_Model'),sorted_aggregated_df_final['Binary_Predictions'],sorted_aggregated_df_final['PointID']], axis=1)
    threshold = 0.5
    LastDataframe['LinearCOmbination0.5'] = ((0.5 * LastDataframe['Global_Model'] + 0.5 * LastDataframe['Binary_Predictions'])> threshold).astype(int)
    LastDataframe['LinearCOmbination0.25'] = ((0.25 * LastDataframe['Global_Model'] + 0.75 * LastDataframe['Binary_Predictions'])> threshold).astype(int)
    LastDataframe['LinearCOmbination0.75'] = ((0.75 * LastDataframe['Global_Model'] + 0.25 * LastDataframe['Binary_Predictions'])> threshold).astype(int)


    # Calculate True Positives (TP)
    TP05 = ((LastDataframe['dust_storm'] == 1) & (LastDataframe['LinearCOmbination0.5'] == 1)).sum()
    TP025 = ((LastDataframe['dust_storm'] == 1) & (LastDataframe['LinearCOmbination0.25'] == 1)).sum()
    TP075 = ((LastDataframe['dust_storm'] == 1) & (LastDataframe['LinearCOmbination0.75'] == 1)).sum()

    # Calculate True Negatives (TN)
    TN05 = ((LastDataframe['dust_storm'] == 0) & (LastDataframe['LinearCOmbination0.5'] == 0)).sum()
    TN025 = ((LastDataframe['dust_storm'] == 0) & (LastDataframe['LinearCOmbination0.25'] == 0)).sum()
    TN075 = ((LastDataframe['dust_storm'] == 0) & (LastDataframe['LinearCOmbination0.75'] == 0)).sum()

    # Calculate False Positives (FP)
    FP05 = ((LastDataframe['dust_storm'] == 0) & (LastDataframe['LinearCOmbination0.5'] == 1)).sum()
    FP025 = ((LastDataframe['dust_storm'] == 0) & (LastDataframe['LinearCOmbination0.25'] == 1)).sum()
    FP075 = ((LastDataframe['dust_storm'] == 0) & (LastDataframe['LinearCOmbination0.75'] == 1)).sum()

    # Calculate False Negatives (FN)
    FN05 = ((LastDataframe['dust_storm'] == 1) & (LastDataframe['LinearCOmbination0.5'] == 0)).sum()
    FN025 = ((LastDataframe['dust_storm'] == 1) & (LastDataframe['LinearCOmbination0.25'] == 0)).sum()
    FN075 = ((LastDataframe['dust_storm'] == 1) & (LastDataframe['LinearCOmbination0.75'] == 0)).sum()

    # Calculate Accuracy
    accuracy05 = (TP05 + TN05) / (TP05 + TN05 + FP05 + FN05)
    accuracy025 = (TP025 + TN025) / (TP025 + TN025 + FP025 + FN025)
    accuracy075 = (TP075 + TN075) / (TP075 + TN075 + FP075 + FN075)

    print('################ Linear Combintion nof Global and local models')
    print(f'Accuracy for 0.5 weights for both Global and Local models = {accuracy05 * 100}')
    print(f'Accuracy for 0.25 weight for GLobal and 0.75 weight for Locals = {accuracy025 * 100}')
    print(f'Accuracy for 0.75 weight for GLobal and 0.25 weight for Locals = {accuracy075 * 100}')


    if AnalyzeResiduales:
        print('########### Combination of linear global model with nonlinear local models ######### ')
        LastLinearDataframe = pd.concat([Vdf['dust_storm'],Linear_model_y_predict.rename('Global_Model'),sorted_aggregated_df_final['Binary_Predictions'],sorted_aggregated_df_final['NonLinear'],sorted_aggregated_df_final['PointID']], axis=1)
        threshold = 0.5
        weight = sorted_aggregated_df_final['NonLinear']/np.sum(sorted_aggregated_df_final['NonLinear'])
        LastDataframe['LinearCOmbination'] = (((1- weight) * LastDataframe['Global_Model'] + weight * LastDataframe['Binary_Predictions'])> threshold).astype(int)

        # Calculate True Positives (TP)
        TP05 = ((LastDataframe['dust_storm'] == 1) & (LastDataframe['LinearCOmbination0.5'] == 1)).sum()

        # Calculate True Negatives (TN)
        TN05 = ((LastDataframe['dust_storm'] == 0) & (LastDataframe['LinearCOmbination0.5'] == 0)).sum()

        # Calculate False Positives (FP)
        FP05 = ((LastDataframe['dust_storm'] == 0) & (LastDataframe['LinearCOmbination0.5'] == 1)).sum()

        # Calculate False Negatives (FN)
        FN05 = ((LastDataframe['dust_storm'] == 1) & (LastDataframe['LinearCOmbination0.5'] == 0)).sum()

        # Calculate Accuracy
        accuracy05 = (TP05 + TN05) / (TP05 + TN05 + FP05 + FN05)

        print('################ Linear Combintion nof Global and local models')
        print(f'Accuracy for linear combination = {accuracy05 * 100}')

    Global_val_accuracy.append(accuracy)
    Global_val_precission.append(precision)
    GWML_val_accuracy.append(accuracy_local)
    GWML_val_precission.append(precision_local)

    Global_test_accuracy.append(accuracy_test)
    Global_test_precission.append(precision_test)
    GWML_test_accuracy.append(accuracy_local_final)
    GWML_test_precission.append(precision_local_final)
    print(f'############# The size of the test dataset{num/100} ##############')

print('finish')

# Plotting
fig, axes = plt.subplots(2, 2, figsize=(12, 8))

# Plot 1: Global Validation
axes[0, 0].plot(numbers, Global_val_accuracy, label='Global Validation Accuracy')
axes[0, 0].plot(numbers, Global_test_accuracy, label='Global test Accuracy')
axes[0, 0].set_xlabel('Test Dataset size')
axes[0, 0].set_ylabel('Accuracy')
axes[0, 0].set_title('Global Validation/Test')
axes[0, 0].legend()
axes[0, 0].grid(True)

# Plot 2: GWML Validation
axes[0, 1].plot(numbers, GWML_val_accuracy, label='GWML Validation Accuracy')
axes[0, 1].plot(numbers, GWML_test_accuracy, label='GWML test Accuracy')
axes[0, 1].set_xlabel('Test Dataset size')
axes[0, 1].set_ylabel('Accuracy')
axes[0, 1].set_title('GWML Validation/Test')
axes[0, 1].legend()
axes[0, 1].grid(True)

# Plot 3: Global Test
axes[1, 0].plot(numbers, Global_val_precission, label='Global Validation Precision')
axes[1, 0].plot(numbers, Global_test_precission, label='Global Test Precision')
axes[1, 0].set_xlabel('Test Dataset size')
axes[1, 0].set_ylabel('Precision')
axes[1, 0].set_title('Global Validation/Test')
axes[1, 0].legend()
axes[1, 0].grid(True)

# Plot 4: GWML Test
axes[1, 1].plot(numbers, GWML_val_precission, label='GWML Validation Precision')
axes[1, 1].plot(numbers, GWML_test_precission, label='GWML Test Precision')
axes[1, 1].set_xlabel('Test Dataset size')
axes[1, 1].set_ylabel('Precision')
axes[1, 1].set_title('GWML Validation/Test')
axes[1, 1].legend()
axes[1, 1].grid(True)

plt.tight_layout()
# plt.show()
plt.savefig('Test_Dataset_change_XGBoost.jpg')
plt.close()