From 6d80afbd9a4dc124daded2507b3925f7ccc40267 Mon Sep 17 00:00:00 2001
From: Mads Christian Lund
Date: Mon, 19 Aug 2024 15:26:27 +0200
Subject: [PATCH] Applied black on join_l3

---
 src/pypromice/process/join_l3.py | 499 +++++++++++++++++++------------
 1 file changed, 309 insertions(+), 190 deletions(-)

diff --git a/src/pypromice/process/join_l3.py b/src/pypromice/process/join_l3.py
index 4e2c40f7..e528d8ef 100644
--- a/src/pypromice/process/join_l3.py
+++ b/src/pypromice/process/join_l3.py
@@ -6,6 +6,7 @@
 import numpy as np
 import pandas as pd
 import xarray as xr
+
 logging.basicConfig(
     format="%(asctime)s; %(levelname)s; %(name)s; %(message)s",
     level=logging.INFO,
@@ -13,155 +14,218 @@
 )
 logger = logging.getLogger(__name__)
 
+
 def parse_arguments_joinl3(debug_args=None):
-    parser = ArgumentParser(description="AWS L3 script for the processing L3 data from L2 and merging the L3 data with its historical site. An hourly, daily and monthly L3 data product is outputted to the defined output path")
-    parser.add_argument('-c', '--config_folder', type=str, required=True,
-                        help='Path to folder with sites configuration (TOML) files')
-    parser.add_argument('-s', '--site', default=None, type=str, required=False,
-                        help='Name of site to process (default: all sites are processed)')
-
-    parser.add_argument('-l3', '--folder_l3', type=str, required=True,
-                        help='Path to level 3 folder')
-    parser.add_argument('-gc', '--folder_gcnet', type=str, required=False,
-                        help='Path to GC-Net historical L1 folder')
-
-    parser.add_argument('-o', '--outpath', default=os.getcwd(), type=str, required=True,
-                        help='Path where to write output')
-
-    parser.add_argument('-v', '--variables', default=None, type=str, required=False,
-                        help='Path to variables look-up table .csv file for variable name retained'''),
-    parser.add_argument('-m', '--metadata', default=None, type=str, required=False,
-                        help='Path to metadata table .csv file for metadata information'''),
+    parser = ArgumentParser(
+        description="AWS L3 script for processing L3 data from L2 and merging the L3 data with historical data from the same site. 
Hourly, daily and monthly L3 data products are written to the defined output path."
+    )
+    parser.add_argument(
+        "-c",
+        "--config_folder",
+        type=str,
+        required=True,
+        help="Path to folder with sites configuration (TOML) files",
+    )
+    parser.add_argument(
+        "-s",
+        "--site",
+        default=None,
+        type=str,
+        required=False,
+        help="Name of site to process (default: all sites are processed)",
+    )
+
+    parser.add_argument(
+        "-l3", "--folder_l3", type=str, required=True, help="Path to level 3 folder"
+    )
+    parser.add_argument(
+        "-gc",
+        "--folder_gcnet",
+        type=str,
+        required=False,
+        help="Path to GC-Net historical L1 folder",
+    )
+
+    parser.add_argument(
+        "-o",
+        "--outpath",
+        default=os.getcwd(),
+        type=str,
+        required=True,
+        help="Path where to write output",
+    )
+
+    parser.add_argument(
+        "-v",
+        "--variables",
+        default=None,
+        type=str,
+        required=False,
+        help="Path to variables look-up table .csv file for variable names retained",
+    )
+    parser.add_argument(
+        "-m",
+        "--metadata",
+        default=None,
+        type=str,
+        required=False,
+        help="Path to metadata table .csv file for metadata information",
+    )
     args = parser.parse_args(args=debug_args)
     return args
 
+
 def readNead(infile):
     with open(infile) as f:
         fmt = f.readline()
-        assert(fmt[0] == "#")
-        assert(fmt.split("#")[1].split()[0] == "NEAD")
-        assert(fmt.split("#")[1].split()[1] == "1.0")
-        assert(fmt.split("#")[1].split()[2] == "UTF-8")
-
+        assert fmt[0] == "#"
+        assert fmt.split("#")[1].split()[0] == "NEAD"
+        assert fmt.split("#")[1].split()[1] == "1.0"
+        assert fmt.split("#")[1].split()[2] == "UTF-8"
+
         line = f.readline()
-        assert(line[0] == "#")
-        assert(line.split("#")[1].strip() == '[METADATA]')
-
+        assert line[0] == "#"
+        assert line.split("#")[1].strip() == "[METADATA]"
+
         meta = {}
         fields = {}
-        section = 'meta'
+        section = "meta"
         while True:
             line = f.readline()
-            if line.strip(' ') == '#': continue
-            if line == "# [DATA]\n": break # done reading header
+            if line.strip(" ") == "#":
+                continue
+            if line == "# [DATA]\n":
+                break  # done reading header
             if line == "# [FIELDS]\n":
-                section = 'fields'
-                continue # done reading header
-
-            if line[0] == "\n": continue # blank line
-            assert(line[0] == "#") # if not blank, must start with "#"
-
+                section = "fields"
+                continue  # start of the [FIELDS] section
+
+            if line[0] == "\n":
+                continue  # blank line
+            assert line[0] == "#"  # if not blank, must start with "#"
+
             key_eq_val = line.split("#")[1].strip()
-            if key_eq_val == '' or key_eq_val == None: continue # Line is just "#" or "# " or "# #"...
-            assert("=" in key_eq_val), print(line, key_eq_val)
+            if key_eq_val == "" or key_eq_val is None:
+                continue  # Line is just "#" or "# " or "# #"...
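+            # For reference, a NEAD header is a block of "# key = value"
+            # lines between section markers, e.g. (values illustrative only):
+            #   # NEAD 1.0 UTF-8
+            #   # [METADATA]
+            #   # field_delimiter = ,
+            #   # [FIELDS]
+            #   # fields = timestamp,TA1,TA2
+            #   # [DATA]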
+            assert "=" in key_eq_val, f"invalid NEAD header line: {line}"
             key = key_eq_val.split("=")[0].strip()
             val = key_eq_val.split("=")[1].strip()
-
+
             # Convert from string to number if it is a number
-            if val.strip('-').strip('+').replace('.','').isdigit():
+            if val.strip("-").strip("+").replace(".", "").isdigit():
                 val = float(val)
                 if val == int(val):
                     val = int(val)
-
-            if section == 'meta': meta[key] = val
-            if section == 'fields': fields[key] = val
+
+            if section == "meta":
+                meta[key] = val
+            if section == "fields":
+                fields[key] = val
         # done reading header
-
+
     # Find delimiter and fields for reading NEAD as simple CSV
-    assert("field_delimiter" in meta.keys())
-    assert("fields" in fields.keys())
+    assert "field_delimiter" in meta.keys()
+    assert "fields" in fields.keys()
     FD = meta["field_delimiter"]
-    names = [_.strip() for _ in fields.pop('fields').split(FD)]
-
-    df = pd.read_csv(infile,
-                     comment = "#",
-                     names = names,
-                     sep = FD,
-                     usecols=np.arange(len(names)),
-                     skip_blank_lines = True)
-    df['timestamp'] = pd.to_datetime(df.timestamp).dt.tz_localize(None)
-    df = df.set_index('timestamp')
+    names = [_.strip() for _ in fields.pop("fields").split(FD)]
+
+    df = pd.read_csv(
+        infile,
+        comment="#",
+        names=names,
+        sep=FD,
+        usecols=np.arange(len(names)),
+        skip_blank_lines=True,
+    )
+    df["timestamp"] = pd.to_datetime(df.timestamp).dt.tz_localize(None)
+    df = df.set_index("timestamp")
     ds = df.to_xarray()
     ds.attrs = meta
-
+
     # renaming variables
     file_path = pypromice.resources.DEFAULT_VARIABLES_ALIASES_GCNET_PATH
     var_name = pd.read_csv(file_path)
-    var_name = var_name.set_index('old_name').GEUS_name
+    var_name = var_name.set_index("old_name").GEUS_name
     msk = [v for v in var_name.index if v in ds.data_vars]
     var_name = var_name.loc[msk].to_dict()
-
+
     # combining thermocouple and CS100 temperatures
-    ds['TA1'] = ds['TA1'].combine_first(ds['TA3'])
-    ds['TA2'] = ds['TA2'].combine_first(ds['TA4'])
-
+    ds["TA1"] = ds["TA1"].combine_first(ds["TA3"])
+    ds["TA2"] = ds["TA2"].combine_first(ds["TA4"])
+
     # renaming variables to the GEUS names
-    ds=ds.rename(var_name)
-
+    ds = ds.rename(var_name)
+
     # variables always dropped from the historical GC-Net files
     # could be moved to the config files at some point
-    standard_vars_to_drop = ["NR", "TA3", "TA4", "TA5", "NR_cor", "TA2m",
-                             "RH2m", "VW10m", "SZA", "SAA"]
-    standard_vars_to_drop = standard_vars_to_drop + [v for v in list(ds.keys()) if v.endswith("_adj_flag")]
+    standard_vars_to_drop = [
+        "NR",
+        "TA3",
+        "TA4",
+        "TA5",
+        "NR_cor",
+        "TA2m",
+        "RH2m",
+        "VW10m",
+        "SZA",
+        "SAA",
+    ]
+    standard_vars_to_drop = standard_vars_to_drop + [
+        v for v in list(ds.keys()) if v.endswith("_adj_flag")
+    ]
    # Drop the variables if they are present in the dataset
    ds = ds.drop_vars([var for var in standard_vars_to_drop if var in ds])
-
-    ds=ds.rename({'timestamp':'time'})
-
+
+    ds = ds.rename({"timestamp": "time"})
+
     # in the historical GC-Net processing, periods with missing z_surf_combined
     # are filled with a constant value; these values should be removed to
     # allow a better alignment with the z_surf_combined estimated for the GEUS stations
-    ds['z_surf_combined'] = ds['z_surf_combined'].where(ds['z_surf_combined'].diff(dim='time')!=0)
+    ds["z_surf_combined"] = ds["z_surf_combined"].where(
+        ds["z_surf_combined"].diff(dim="time") != 0
+    )
     return ds
 
+
 def loadArr(infile, isNead):
-    if infile.split('.')[-1].lower() in 'csv':
+    if infile.split(".")[-1].lower() == "csv":
         if isNead:
             ds = readNead(infile)
         else:
             df = pd.read_csv(infile)
-            df['time'] = pd.to_datetime(df['time']).dt.tz_localize(None)
-            df = df.set_index('time')
+            df["time"] = pd.to_datetime(df["time"]).dt.tz_localize(None)
+            df = df.set_index("time")
             ds = xr.Dataset.from_dataframe(df)
-
-    elif infile.split('.')[-1].lower() in 'nc':
+
+    elif infile.split(".")[-1].lower() == "nc":
         with xr.open_dataset(infile) as ds:
             ds.load()
         # Remove encoding attributes from NetCDF
         for varname in ds.variables:
-            if ds[varname].encoding!={}:
+            if ds[varname].encoding != {}:
                 ds[varname].encoding = {}
-
+
     try:
-        name = ds.attrs['station_name']
+        name = ds.attrs["station_name"]
     except KeyError:
-        name = infile.split('/')[-1].split('.')[0].split('_hour')[0].split('_10min')[0]
-
-    print(f'{name} array loaded from {infile}')
+        name = infile.split("/")[-1].split(".")[0].split("_hour")[0].split("_10min")[0]
+
+    print(f"{name} array loaded from {infile}")
     return ds, name
 
+
 def align_surface_heights(data_series_new, data_series_old):
     """
     Align two surface height time series based on the gap between their end and start.
 
     If the gap between the end of `data_series_old` and the start of `data_series_new`
     is less than a week, the function aligns them based on the median value of
     the last week of `data_series_old` and the first week of `data_series_new`.
     If the gap is larger than a week, it aligns them using a linear fit. If
     there is overlap, the function uses the overlapping period to adjust the
     newer time series.
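 
     For example (values are illustrative): if the old series ends at 10.0 m
     and the new series starts three days later around 0.0 m, the one-week
     medians on either side of the gap differ by roughly 10 m, so the new
     series is shifted up by roughly 10 m before the two records are joined.
 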
     Parameters
@@ -184,53 +248,62 @@ def align_surface_heights(data_series_new, data_series_old):
     if first_new_idx <= last_old_idx:
         # Find the overlapping period
         overlap_start = first_new_idx
-        overlap_end = min(last_old_idx, overlap_start+pd.to_timedelta('7D'))
-
+        overlap_end = min(last_old_idx, overlap_start + pd.to_timedelta("7D"))
+
         # Compute the median values for the overlapping period
         overlap_old = data_series_old[overlap_start:overlap_end].median()
         overlap_new = data_series_new[overlap_start:overlap_end].median()
-
+
         if np.isnan(overlap_old) or np.isnan(overlap_new):
             overlap_end = min(last_old_idx, data_series_new.last_valid_index())
-
+
             # Compute the median values for the overlapping period
             overlap_old = data_series_old[overlap_start:overlap_end].median()
             overlap_new = data_series_new[overlap_start:overlap_end].median()
-
+
         # Align based on the overlapping median values
         data_series_new = data_series_new - overlap_new + overlap_old
-
+
     elif (first_new_idx - last_old_idx).days <= 7:
         # Compute the median of the last week of data in the old series
-        last_week_old = data_series_old[last_old_idx - pd.Timedelta(weeks=1):last_old_idx].median()
-
+        last_week_old = data_series_old[
+            last_old_idx - pd.Timedelta(weeks=1) : last_old_idx
+        ].median()
+
         # Compute the median of the first week of data in the new series
-        first_week_new = data_series_new[first_new_idx:first_new_idx + pd.Timedelta(weeks=1)].median()
-
+        first_week_new = data_series_new[
+            first_new_idx : first_new_idx + pd.Timedelta(weeks=1)
+        ].median()
+
         # Align based on the median values
         data_series_new = data_series_new - first_week_new + last_week_old
     else:
         # Perform a linear fit on the last 5x365x24 non-nan values
         hours_in_5_years = 5 * 365 * 24
-
+
         # Drop NaN values and extract the last `hours_in_5_years` non-NaN data points
         data_series_old_nonan = data_series_old.dropna()
         data_series_old_last_5_years = data_series_old_nonan.iloc[
-            -min(len(data_series_old), hours_in_5_years):]
-
+            -min(len(data_series_old_nonan), hours_in_5_years) :
+        ]
+
         # Perform a linear fit on the last 5 years of data
         fit = np.polyfit(
-            data_series_old_last_5_years.index.astype('int64'),
-            data_series_old_last_5_years.values, 1
+            data_series_old_last_5_years.index.astype("int64"),
+            data_series_old_last_5_years.values,
+            1,
         )
         fit_fn = np.poly1d(fit)
-
-        data_series_new = data_series_new.values \
-            + fit_fn(data_series_new.index.astype('int64')[0]) \
-            - data_series_new[first_new_idx]
-
+
+        data_series_new = (
+            data_series_new
+            + fit_fn(data_series_new.index.astype("int64")[0])
+            - data_series_new[first_new_idx]
+        )
+
     return data_series_new
 

+
 def build_station_list(config_folder: str, target_station_site: str) -> list:
     """
     Get a list of unique station information dictionaries for a given station site.
@@ -248,109 +321,132 @@ def build_station_list(config_folder: str, target_station_site: str) -> list:
         A list of dictionaries containing the station information for the specified station site.
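 
     Examples
     --------
     Hypothetical usage, assuming a folder with two configuration files
     whose ``station_site`` is ``SCO_L`` (e.g. stations SCO_L and SCO_Lv3):
 
     >>> stations = build_station_list("./configs", "SCO_L")  # doctest: +SKIP
     >>> [s["stid"] for s in stations]  # doctest: +SKIP
     ['SCO_L', 'SCO_Lv3']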
""" station_info_list = [] # Initialize an empty list to store station information - + found_as_station = False for filename in os.listdir(config_folder): if filename.endswith(".toml"): file_path = os.path.join(config_folder, filename) - - with open(file_path, 'r') as file: + + with open(file_path, "r") as file: data = toml.load(file) # Load the TOML file station_site = data.get("station_site") # Get the station site stid = data.get("stid") # Get the station ID - + # Check if the station site matches the target and stid is unique if stid == target_station_site: found_as_station = True if station_site == target_station_site and stid: station_info = data.copy() # Copy all attributes from the TOML file - station_info_list.append(station_info) # Add the station info to the list - - - if len(station_info_list)==0 and not found_as_station: - logger.error('\n***\nNo station_configuration file found for %s.\nProcessing it as a single-station PROMICE site.\n***'%target_station_site) + station_info_list.append( + station_info + ) # Add the station info to the list + + if len(station_info_list) == 0 and not found_as_station: + logger.error( + "\n***\nNo station_configuration file found for %s.\nProcessing it as a single-station PROMICE site.\n***" + % target_station_site + ) station_info = { "stid": target_station_site, "station_site": target_station_site, "project": "PROMICE", "location_type": "ice sheet", - } + } station_info_list.append(station_info) - elif len(station_info_list)==0 : - logger.error('\n***\nThe name \"%s\" passed to join_l3 is a station name and not a site name (e.g. SCO_Lv3 instead of SCO_L). Please provide a site name that is named at least once in the "station_site" attribute of the station configuration files.\n***'%target_station_site) - + elif len(station_info_list) == 0: + logger.error( + '\n***\nThe name "%s" passed to join_l3 is a station name and not a site name (e.g. SCO_Lv3 instead of SCO_L). 
Please provide a site name that is named at least once in the "station_site" attribute of the station configuration files.\n***' + % target_station_site + ) + return station_info_list + def join_l3(config_folder, site, folder_l3, folder_gcnet, outpath, variables, metadata): - # Get the list of station information dictionaries associated with the given site list_station_info = build_station_list(config_folder, site) - + # Read the datasets and store them into a list along with their latest timestamp and station info list_station_data = [] - for station_info in list_station_info: + for station_info in list_station_info: stid = station_info["stid"] - - filepath = os.path.join(folder_l3, stid, stid+'_hour.nc') + + filepath = os.path.join(folder_l3, stid, stid + "_hour.nc") isNead = False if station_info["project"].lower() in ["historical gc-net"]: - filepath = os.path.join(folder_gcnet, stid+'.csv') + filepath = os.path.join(folder_gcnet, stid + ".csv") isNead = True if not os.path.isfile(filepath): - logger.error('\n***\n'+stid+' was listed as station but could not be found in '+folder_l3+' nor '+folder_gcnet+'\n***') + logger.error( + "\n***\n" + + stid + + " was listed as station but could not be found in " + + folder_l3 + + " nor " + + folder_gcnet + + "\n***" + ) continue - l3, _ = loadArr(filepath, isNead) - + l3, _ = loadArr(filepath, isNead) + # removing specific variable from a given file - specific_vars_to_drop = station_info.get("skipped_variables",[]) - if len(specific_vars_to_drop)>0: - logger.info("Skipping %s from %s"%(specific_vars_to_drop, stid)) + specific_vars_to_drop = station_info.get("skipped_variables", []) + if len(specific_vars_to_drop) > 0: + logger.info("Skipping %s from %s" % (specific_vars_to_drop, stid)) l3 = l3.drop_vars([var for var in specific_vars_to_drop if var in l3]) list_station_data.append((l3, station_info)) # Sort the list in reverse chronological order so that we start with the latest data - sorted_list_station_data = sorted(list_station_data, key=lambda x: x[0].time.min(), reverse=True) + sorted_list_station_data = sorted( + list_station_data, key=lambda x: x[0].time.min(), reverse=True + ) sorted_stids = [info["stid"] for _, info in sorted_list_station_data] - logger.info('joining %s' % ' '.join(sorted_stids)) - + logger.info("joining %s" % " ".join(sorted_stids)) + l3_merged = None for l3, station_info in sorted_list_station_data: stid = station_info["stid"] - + if l3_merged is None: # saving attributes of stid st_attrs = {} st_attrs[stid] = l3.attrs.copy() # adding timestamps info - st_attrs[stid]['first_timestamp'] = l3.time.isel(time=0).dt.strftime( date_format='%Y-%m-%d %H:%M:%S').item() - st_attrs[stid]['last_timestamp'] = l3.time.isel(time=-1).dt.strftime( date_format='%Y-%m-%d %H:%M:%S').item() - + st_attrs[stid]["first_timestamp"] = ( + l3.time.isel(time=0).dt.strftime(date_format="%Y-%m-%d %H:%M:%S").item() + ) + st_attrs[stid]["last_timestamp"] = ( + l3.time.isel(time=-1) + .dt.strftime(date_format="%Y-%m-%d %H:%M:%S") + .item() + ) + # then stripping attributes attrs_list = list(l3.attrs.keys()) for k in attrs_list: del l3.attrs[k] - + # initializing l3_merged with l3 l3_merged = l3.copy() - + # creating the station_attributes attribute in l3_merged l3_merged.attrs["stations_attributes"] = st_attrs - + else: # if l3 (older data) is missing variables compared to l3_merged (newer data) # , then we fill them with nan for v in l3_merged.data_vars: - if v not in l3.data_vars: - l3[v] = l3.t_u*np.nan + if v not in l3.data_vars: + l3[v] = l3.t_u 
* np.nan for v in l3.data_vars: - if v not in l3_merged.data_vars: - l3_merged[v] = l3_merged.t_u*np.nan - + if v not in l3_merged.data_vars: + l3_merged[v] = l3_merged.t_u * np.nan + # saving attributes of station under an attribute called $stid - st_attrs = l3_merged.attrs.get('stations_attributes', {}) + st_attrs = l3_merged.attrs.get("stations_attributes", {}) st_attrs[stid] = l3.attrs.copy() l3_merged.attrs["stations_attributes"] = st_attrs @@ -358,61 +454,84 @@ def join_l3(config_folder, site, folder_l3, folder_gcnet, outpath, variables, me attrs_list = list(l3.attrs.keys()) for k in attrs_list: del l3.attrs[k] - - l3_merged.attrs['stations_attributes'][stid]['first_timestamp'] = \ - l3.time.isel(time=0).dt.strftime( date_format='%Y-%m-%d %H:%M:%S').item() - l3_merged.attrs['stations_attributes'][stid]['last_timestamp'] = \ - l3_merged.time.isel(time=0).dt.strftime( date_format='%Y-%m-%d %H:%M:%S').item() - + + l3_merged.attrs["stations_attributes"][stid]["first_timestamp"] = ( + l3.time.isel(time=0).dt.strftime(date_format="%Y-%m-%d %H:%M:%S").item() + ) + l3_merged.attrs["stations_attributes"][stid]["last_timestamp"] = ( + l3_merged.time.isel(time=0) + .dt.strftime(date_format="%Y-%m-%d %H:%M:%S") + .item() + ) + # adjusting surface height in the most recent data (l3_merged) # so that it shows continuity with the older data (l3) - if 'z_surf_combined' in l3_merged.keys() and 'z_surf_combined' in l3.keys(): - if l3_merged.z_surf_combined.notnull().any() and l3.z_surf_combined.notnull().any(): - l3_merged['z_surf_combined'] = ('time', - align_surface_heights( - l3_merged.z_surf_combined.to_series(), - l3.z_surf_combined.to_series()) - ) - if 'z_ice_surf' in l3_merged.keys() and 'z_ice_surf' in l3.keys(): - if l3_merged.z_ice_surf.notnull().any() and l3.z_ice_surf.notnull().any(): - l3_merged['z_ice_surf'] = ('time', - align_surface_heights( - l3_merged.z_ice_surf.to_series(), - l3.z_ice_surf.to_series()) - ) + if "z_surf_combined" in l3_merged.keys() and "z_surf_combined" in l3.keys(): + if ( + l3_merged.z_surf_combined.notnull().any() + and l3.z_surf_combined.notnull().any() + ): + l3_merged["z_surf_combined"] = ( + "time", + align_surface_heights( + l3_merged.z_surf_combined.to_series(), + l3.z_surf_combined.to_series(), + ), + ) + if "z_ice_surf" in l3_merged.keys() and "z_ice_surf" in l3.keys(): + if ( + l3_merged.z_ice_surf.notnull().any() + and l3.z_ice_surf.notnull().any() + ): + l3_merged["z_ice_surf"] = ( + "time", + align_surface_heights( + l3_merged.z_ice_surf.to_series(), l3.z_ice_surf.to_series() + ), + ) # merging by time block - l3_merged = xr.concat((l3.sel( - time=slice(l3.time.isel(time=0), - l3_merged.time.isel(time=0)) - ), l3_merged), dim='time') - + l3_merged = xr.concat( + ( + l3.sel( + time=slice(l3.time.isel(time=0), l3_merged.time.isel(time=0)) + ), + l3_merged, + ), + dim="time", + ) # Assign site id if not l3_merged: - logger.error('No level 3 station data file found for '+site) + logger.error("No level 3 station data file found for " + site) return None, sorted_list_station_data - l3_merged.attrs['site_id'] = site - l3_merged.attrs['stations'] = ' '.join(sorted_stids) - l3_merged.attrs['level'] = 'L3' - l3_merged.attrs['project'] = sorted_list_station_data[0][1]['project'] - l3_merged.attrs['location_type'] = sorted_list_station_data[0][1]['location_type'] - + l3_merged.attrs["site_id"] = site + l3_merged.attrs["stations"] = " ".join(sorted_stids) + l3_merged.attrs["level"] = "L3" + l3_merged.attrs["project"] = sorted_list_station_data[0][1]["project"] + 
l3_merged.attrs["location_type"] = sorted_list_station_data[0][1]["location_type"] + v = pypromice.resources.load_variables(variables) m = pypromice.resources.load_metadata(metadata) if outpath is not None: - prepare_and_write(l3_merged, outpath, v, m, '60min') - prepare_and_write(l3_merged, outpath, v, m, '1D') - prepare_and_write(l3_merged, outpath, v, m, 'M') + prepare_and_write(l3_merged, outpath, v, m, "60min") + prepare_and_write(l3_merged, outpath, v, m, "1D") + prepare_and_write(l3_merged, outpath, v, m, "M") return l3_merged, sorted_list_station_data - + + def main(): args = parse_arguments_joinl3() - _, _ = join_l3(args.config_folder, args.site, args.folder_l3, - args.folder_gcnet, args.outpath, args.variables, - args.metadata) + _, _ = join_l3( + args.config_folder, + args.site, + args.folder_l3, + args.folder_gcnet, + args.outpath, + args.variables, + args.metadata, + ) + - -if __name__ == "__main__": +if __name__ == "__main__": main() -
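
For reference, once this patch is applied the script is still invoked per site
through its CLI (parse_arguments_joinl3 above); the paths and site name below
are illustrative only:

    python -m pypromice.process.join_l3 \
        --config_folder ./station_configurations \
        --folder_l3 ./aws-l3/stations \
        --folder_gcnet ./gcnet/historical-l1 \
        --outpath ./aws-l3/sites \
        --site SCO_L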