From ca85179fa90f5ebcbe9ea09d9d3bc8226b9454c7 Mon Sep 17 00:00:00 2001 From: vishal Date: Mon, 28 Oct 2024 09:52:25 -0500 Subject: [PATCH 01/13] initial transformation function --- data_transformation_plugins/__init__.py | 0 .../tm54dvar_ch4flux_mask_monthgrid_v5.py | 43 +++++++++++++++++++ 2 files changed, 43 insertions(+) create mode 100644 data_transformation_plugins/__init__.py create mode 100644 data_transformation_plugins/tm54dvar_ch4flux_mask_monthgrid_v5.py diff --git a/data_transformation_plugins/__init__.py b/data_transformation_plugins/__init__.py new file mode 100644 index 00000000..e69de29b diff --git a/data_transformation_plugins/tm54dvar_ch4flux_mask_monthgrid_v5.py b/data_transformation_plugins/tm54dvar_ch4flux_mask_monthgrid_v5.py new file mode 100644 index 00000000..99fcc503 --- /dev/null +++ b/data_transformation_plugins/tm54dvar_ch4flux_mask_monthgrid_v5.py @@ -0,0 +1,43 @@ +import xarray +from datetime import datetime + +def tm54dvar_ch4flux_mask_monthgrid_v5_transformation(file_obj, name, nodata): + """Tranformation function for the tm5 ch4 influx dataset + + Args: + file_obj (s3fs object): s3fs sile object for one file of the dataset + name (str): name of the file to be transformed + nodata (int): Nodata value as specified by the data provider + + Returns: + dict: Dictionary with the COG name and its corresponding data array. + """ + + var_data_netcdf = {} + xds = xarray.open_dataset(file_obj) + xds = xds.rename({"latitude": "lat", "longitude": "lon"}) + xds = xds.assign_coords(lon=(((xds.lon + 180) % 360) - 180)).sortby("lon") + variable = [var for var in xds.data_vars if "global" not in var] + + for time_increment in range(0, len(xds.months)): + filename = name.split("/")[-1] + filename_elements = re.split("[_ .]", filename) + start_time = datetime(int(filename_elements[-2]), time_increment + 1, 1) + for var in variable: + data = getattr(xds.isel(months=time_increment), var) + data = data.isel(lat=slice(None, None, -1)) + data = data.where(data == nodata, -9999) + data.rio.set_spatial_dims("lon", "lat", inplace=True) + data.rio.write_crs("epsg:4326", inplace=True) + data.rio.write_nodata(-9999, inplace=True) + + # # insert date of generated COG into filename + filename_elements.pop() + filename_elements[-1] = start_time.strftime("%Y%m") + filename_elements.insert(2, var) + cog_filename = "_".join(filename_elements) + # # add extension + cog_filename = f"{cog_filename}.tif" + var_data_netcdf[cog_filename] = data + + return var_data_netcdf \ No newline at end of file From 79e5c5b38a4b6b50b0c9dd905c9fd813bb37836e Mon Sep 17 00:00:00 2001 From: vishal Date: Mon, 28 Oct 2024 09:52:50 -0500 Subject: [PATCH 02/13] initial transformation function --- .../tm54dvar_ch4flux_mask_monthgrid_v5.py | 1 + 1 file changed, 1 insertion(+) diff --git a/data_transformation_plugins/tm54dvar_ch4flux_mask_monthgrid_v5.py b/data_transformation_plugins/tm54dvar_ch4flux_mask_monthgrid_v5.py index 99fcc503..73168450 100644 --- a/data_transformation_plugins/tm54dvar_ch4flux_mask_monthgrid_v5.py +++ b/data_transformation_plugins/tm54dvar_ch4flux_mask_monthgrid_v5.py @@ -1,5 +1,6 @@ import xarray from datetime import datetime +import re def tm54dvar_ch4flux_mask_monthgrid_v5_transformation(file_obj, name, nodata): """Tranformation function for the tm5 ch4 influx dataset From c567180b6e0801aa2a0ab0d5cded59383b71ffae Mon Sep 17 00:00:00 2001 From: vishal Date: Mon, 28 Oct 2024 11:46:10 -0500 Subject: [PATCH 03/13] added transformation plugins for different datasets --- 
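Note: a minimal sketch of how these plugin functions are meant to be driven,
assuming s3fs for reading the source file and rioxarray for writing the
returned arrays out as COGs. The bucket, key, and nodata value below are
illustrative placeholders, not the actual DAG wiring.

```python
# Hypothetical driver for one plugin; bucket, key, and nodata are placeholders.
import rioxarray  # noqa: F401  (registers the .rio accessor the plugins rely on)
import s3fs

from data_transformation_plugins.tm54dvar_ch4flux_mask_monthgrid_v5 import (
    tm54dvar_ch4flux_mask_monthgrid_v5_transformation,
)

fs = s3fs.S3FileSystem()
key = "example-bucket/raw/tm54dvar/fluxes_1998.nc"  # placeholder S3 key

with fs.open(key) as file_obj:
    # Each plugin returns {cog_filename: DataArray}, one entry per variable
    # (and per timestep when the file carries a time-like dimension).
    cog_map = tm54dvar_ch4flux_mask_monthgrid_v5_transformation(
        file_obj, name=key, nodata=-9999
    )

for cog_filename, data in cog_map.items():
    # Write each georeferenced DataArray out as a Cloud Optimized GeoTIFF.
    data.rio.to_raster(cog_filename, driver="COG")
```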
data_transformation_plugins/ecco_darwin.py | 47 ++++++++++++++++++++++ data_transformation_plugins/geos_oco2.py | 38 +++++++++++++++++ data_transformation_plugins/gpw.py | 33 +++++++++++++++ data_transformation_plugins/push_to_s3.py | 35 ++++++++++++++++ 4 files changed, 153 insertions(+) create mode 100644 data_transformation_plugins/ecco_darwin.py create mode 100644 data_transformation_plugins/geos_oco2.py create mode 100644 data_transformation_plugins/gpw.py create mode 100644 data_transformation_plugins/push_to_s3.py diff --git a/data_transformation_plugins/ecco_darwin.py b/data_transformation_plugins/ecco_darwin.py new file mode 100644 index 00000000..90ac2da9 --- /dev/null +++ b/data_transformation_plugins/ecco_darwin.py @@ -0,0 +1,47 @@ +import xarray +import re + +def ecco_darwin_transformation(file_obj, name, nodata): + """Tranformation function for the ecco darwin dataset + + Args: + file_obj (s3fs object): s3fs sile object for one file of the dataset + name (str): name of the file to be transformed + nodata (int): Nodata value as specified by the data provider + + Returns: + dict: Dictionary with the COG name and its corresponding data array. + """ + var_data_netcdf = {} + xds = xarray.open_dataset(file_obj) + xds = xds.rename({"y": "latitude", "x": "longitude"}) + xds = xds.assign_coords(longitude=((xds.longitude / 1440) * 360) - 180).sortby( + "longitude" + ) + xds = xds.assign_coords(latitude=((xds.latitude / 721) * 180) - 90).sortby( + "latitude" + ) + + variable = [var for var in xds.data_vars] + + for _ in xds.time.values: + for var in variable[2:]: + filename = name.split("/")[-1] + filename_elements = re.split("[_ .]", filename) + data = xds[var] + + data = data.reindex(latitude=list(reversed(data.latitude))) + data = data.where(data == nodata, -9999) + data.rio.set_spatial_dims("longitude", "latitude", inplace=True) + data.rio.write_crs("epsg:4326", inplace=True) + data.rio.write_nodata(-9999, inplace=True) + + filename_elements.pop() + filename_elements[-1] = filename_elements[-2] + filename_elements[-1] + filename_elements.pop(-2) + # # insert date of generated COG into filename + cog_filename = "_".join(filename_elements) + # # add extension + cog_filename = f"{cog_filename}.tif" + var_data_netcdf[cog_filename] = data + return var_data_netcdf \ No newline at end of file diff --git a/data_transformation_plugins/geos_oco2.py b/data_transformation_plugins/geos_oco2.py new file mode 100644 index 00000000..f647e33d --- /dev/null +++ b/data_transformation_plugins/geos_oco2.py @@ -0,0 +1,38 @@ +import xarray +import re + +def geos_oco2_transformation(file_obj, name, nodata): + """Tranformation function for the oco2 geos dataset + + Args: + file_obj (s3fs object): s3fs sile object for one file of the dataset + name (str): name of the file to be transformed + nodata (int): Nodata value as specified by the data provider + + Returns: + dict: Dictionary with the COG name and its corresponding data array. 
+ """ + var_data_netcdf = {} + xds = xarray.open_dataset(file_obj) + xds = xds.assign_coords(lon=(((xds.lon + 180) % 360) - 180)).sortby("lon") + variable = [var for var in xds.data_vars] + for time_increment in range(0, len(xds.time)): + for var in variable: + filename = name.split("/ ")[-1] + filename_elements = re.split("[_ .]", filename) + data = getattr(xds.isel(time=time_increment), var) + data = data.isel(lat=slice(None, None, -1)) + data = data.where(data == nodata, -9999) + data.rio.set_spatial_dims("lon", "lat", inplace=True) + data.rio.write_crs("epsg:4326", inplace=True) + data.rio.write_nodata(-9999, inplace=True) + # # insert date of generated COG into filename + filename_elements[-1] = filename_elements[-3] + filename_elements.insert(2, var) + filename_elements.pop(-3) + cog_filename = "_".join(filename_elements) + # # add extension + cog_filename = f"{cog_filename}.tif" + var_data_netcdf[cog_filename] = data + + return var_data_netcdf \ No newline at end of file diff --git a/data_transformation_plugins/gpw.py b/data_transformation_plugins/gpw.py new file mode 100644 index 00000000..6f030623 --- /dev/null +++ b/data_transformation_plugins/gpw.py @@ -0,0 +1,33 @@ +import xarray +import re + +def gpw_transformation(file_obj, name, nodata): + """Tranformation function for the gridded population dataset + + Args: + file_obj (s3fs object): s3fs sile object for one file of the dataset + name (str): name of the file to be transformed + nodata (int): Nodata value as specified by the data provider + + Returns: + dict: Dictionary with the COG name and its corresponding data array. + """ + + var_data_netcdf = {} + xds = xarray.open_dataarray(file_obj, engine="rasterio") + + filename = name.split("/")[-1] + filename_elements = re.split("[_ .]", filename) + # # insert date of generated COG into filename + filename_elements.pop() + filename_elements.append(filename_elements[-3]) + xds = xds.where(xds == nodata, -9999) + xds.rio.set_spatial_dims("x", "y", inplace=True) + xds.rio.write_crs("epsg:4326", inplace=True) + xds.rio.write_nodata(-9999, inplace=True) + + cog_filename = "_".join(filename_elements) + # # add extension + cog_filename = f"{cog_filename}.tif" + var_data_netcdf[cog_filename] = xds + return var_data_netcdf \ No newline at end of file diff --git a/data_transformation_plugins/push_to_s3.py b/data_transformation_plugins/push_to_s3.py new file mode 100644 index 00000000..18617f9a --- /dev/null +++ b/data_transformation_plugins/push_to_s3.py @@ -0,0 +1,35 @@ +import boto3 +import os + +def upload_folder_to_s3(folder_path, bucket_name, s3_folder, exclude_files): + """ + Uploads all files in a folder to a specified S3 folder, excluding specified files. + + Parameters: + - folder_path (str): Path to the local folder containing files to upload. + - bucket_name (str): Name of the S3 bucket. + - s3_folder (str): Destination folder path in the S3 bucket. + - exclude_files (list): List of files to exclude from uploading. 
+    """
+    # Initialize S3 client
+    s3 = boto3.client('s3')
+
+    # Loop through files in the local folder
+    for file_name in os.listdir(folder_path):
+        file_path = os.path.join(folder_path, file_name)
+
+        # Check if it's a file and not in the exclude list
+        if os.path.isfile(file_path) and file_name not in exclude_files:
+            s3_key = os.path.join(s3_folder, file_name)
+
+            try:
+                # Upload the file
+                s3.upload_file(file_path, bucket_name, s3_key)
+                print(f"Uploaded {file_name} to {s3_key}")
+            except Exception as e:
+                print(f"Error uploading {file_name}: {e}")
+
+# Example usage:
+# upload_folder_to_s3("path/to/local/folder", "my-s3-bucket", "my/s3/folder", ["exclude1.ext", "exclude2.ext"])
+if __name__ == "__main__":
+    upload_folder_to_s3("data_transformation_plugins", "ghgc-data-store-develop", "data_transformation_plugins", ["__init__.py", "push_to_s3.py"])
\ No newline at end of file

From 08132c8f4b6089c954eaadcaa467d482ca171377 Mon Sep 17 00:00:00 2001
From: vishal
Date: Mon, 28 Oct 2024 14:47:23 -0500
Subject: [PATCH 04/13] add readme for the folder

---
 data_transformation_plugins/README.md | 4 ++++
 1 file changed, 4 insertions(+)
 create mode 100644 data_transformation_plugins/README.md

diff --git a/data_transformation_plugins/README.md b/data_transformation_plugins/README.md
new file mode 100644
index 00000000..008ca8b1
--- /dev/null
+++ b/data_transformation_plugins/README.md
@@ -0,0 +1,4 @@
+The naming convention for the python files is as follows:
+### collectionname_transformation
+where collection name refers to the STAC collection name that we want to provide
+for the given dataset followed by the word `transformation`. Make sure that the collection name in the function is the same as the one passed as an argument when running the DAG.
\ No newline at end of file

From 11dac6eac2fd0d7ad560a45e0abb05b07c51e403 Mon Sep 17 00:00:00 2001
From: vishal
Date: Mon, 28 Oct 2024 14:58:21 -0500
Subject: [PATCH 05/13] updated the README file

---
 data_transformation_plugins/README.md | 13 +++++++++----
 1 file changed, 9 insertions(+), 4 deletions(-)

diff --git a/data_transformation_plugins/README.md b/data_transformation_plugins/README.md
index 008ca8b1..26524176 100644
--- a/data_transformation_plugins/README.md
+++ b/data_transformation_plugins/README.md
@@ -1,4 +1,9 @@
-The naming convention for the python files is as follows:
-### collectionname_transformation
-where collection name refers to the STAC collection name that we want to provide
-for the given dataset followed by the word `transformation`. Make sure that the collection name in the function is the same as the one passed as an argument when running the DAG.
\ No newline at end of file
+## Information about the folder
+This folder is part of the `automation pipeline using DAG`. It contains the functions essential for transforming a given dataset into COGs. There is a python file for each dataset, and these files are used as plugins in the pipeline.
+
+## How this folder fits in the automation pipeline
+These functions/files are created by the `developer` to transform a single data file to a COG. Once the COGs are validated, these python scripts are pushed to the `GHGC-SMCE S3`. These files are then fetched by the `SM2A DAG` to complete the transformation of the entire dataset automatically.
+
+## Naming convention for the transformation files in the folder
+- `name of python file` - `collectionname_transformation.py`
+`collectionname` refers to the STAC collection name of the dataset followed by the word `transformation`.
Make sure the `collectionname` within the filename matches with the `collectionname` passed as a `parameter` to the DAG.
\ No newline at end of file

From 40f7c369a4677643544345f9d9b0d212632fa71b Mon Sep 17 00:00:00 2001
From: vishal
Date: Tue, 29 Oct 2024 12:24:45 -0500
Subject: [PATCH 06/13] updated file names as per the convention and changed
 the logic for finding files in S3

---
 ...darwin.py => ecco_darwin_tranformation.py} |  0
 ...os_oco2.py => geos_oco2_transformation.py} |  0
 .../{gpw.py => gpw_transformation.py}         |  0
 data_transformation_plugins/push_to_s3.py     | 28 +++++++++++++------
 ...4flux_mask_monthgrid_v5_transformation.py} |  0
 5 files changed, 20 insertions(+), 8 deletions(-)
 rename data_transformation_plugins/{ecco_darwin.py => ecco_darwin_tranformation.py} (100%)
 rename data_transformation_plugins/{geos_oco2.py => geos_oco2_transformation.py} (100%)
 rename data_transformation_plugins/{gpw.py => gpw_transformation.py} (100%)
 rename data_transformation_plugins/{tm54dvar_ch4flux_mask_monthgrid_v5.py => tm54dvar_ch4flux_mask_monthgrid_v5_transformation.py} (100%)

diff --git a/data_transformation_plugins/ecco_darwin.py b/data_transformation_plugins/ecco_darwin_tranformation.py
similarity index 100%
rename from data_transformation_plugins/ecco_darwin.py
rename to data_transformation_plugins/ecco_darwin_tranformation.py
diff --git a/data_transformation_plugins/geos_oco2.py b/data_transformation_plugins/geos_oco2_transformation.py
similarity index 100%
rename from data_transformation_plugins/geos_oco2.py
rename to data_transformation_plugins/geos_oco2_transformation.py
diff --git a/data_transformation_plugins/gpw.py b/data_transformation_plugins/gpw_transformation.py
similarity index 100%
rename from data_transformation_plugins/gpw.py
rename to data_transformation_plugins/gpw_transformation.py
diff --git a/data_transformation_plugins/push_to_s3.py b/data_transformation_plugins/push_to_s3.py
index 18617f9a..85d52c22 100644
--- a/data_transformation_plugins/push_to_s3.py
+++ b/data_transformation_plugins/push_to_s3.py
@@ -1,9 +1,13 @@
 import boto3
 import os
 
+import boto3
+import os
+
 def upload_files_to_s3(folder_path, bucket_name, s3_folder, exclude_files):
     """
-    Uploads all files in a folder to a specified S3 folder, excluding specified files.
+    Uploads all files in a folder to a specified S3 folder, skipping any file that
+    already exists in S3 and excluding the specified files.
 
     Parameters:
     - folder_path (str): Path to the local folder containing files to upload.
@@ -23,13 +27,21 @@ def upload_folder_to_s3(folder_path, bucket_name, s3_folder, exclude_files): s3_key = os.path.join(s3_folder, file_name) try: - # Upload the file - s3.upload_file(file_path, bucket_name, s3_key) - print(f"Uploaded {file_name} to {s3_key}") - except Exception as e: - print(f"Error uploading {file_name}: {e}") + # Check if the file already exists in S3 + s3.head_object(Bucket=bucket_name, Key=s3_key) + print(f"Skipped {file_name} (already exists in S3)") + except s3.exceptions.ClientError as e: + # If the file does not exist, upload it + if e.response['Error']['Code'] == '404': + try: + s3.upload_file(file_path, bucket_name, s3_key) + print(f"Uploaded {file_name} to {s3_key}") + except Exception as upload_error: + print(f"Error uploading {file_name}: {upload_error}") + else: + print(f"Error checking existence of {file_name}: {e}") # Example usage: # upload_folder_to_s3("path/to/local/folder", "my-s3-bucket", "my/s3/folder", ["exclude1.ext", "exclude2.ext"]) if __name__ == "__main__": - upload_folder_to_s3("data_transformation_plugins", "ghgc-data-store-develop", "data_transformation_plugins", ["__init__.py", "push_to_s3.py"]) \ No newline at end of file + upload_files_to_s3("data_transformation_plugins", "ghgc-data-store-develop", "data_transformation_plugins", ["__init__.py", "push_to_s3.py", "README.md"]) \ No newline at end of file diff --git a/data_transformation_plugins/tm54dvar_ch4flux_mask_monthgrid_v5.py b/data_transformation_plugins/tm54dvar_ch4flux_mask_monthgrid_v5_transformation.py similarity index 100% rename from data_transformation_plugins/tm54dvar_ch4flux_mask_monthgrid_v5.py rename to data_transformation_plugins/tm54dvar_ch4flux_mask_monthgrid_v5_transformation.py From d80620e241656b3b42b59628de900990fd109ca7 Mon Sep 17 00:00:00 2001 From: vishal Date: Tue, 29 Oct 2024 16:45:36 -0500 Subject: [PATCH 07/13] updated the logic for no data value and a script to transform gosat ch4 --- ...ation.py => ecco_darwin_transformation.py} | 2 +- .../geos_oco2_transformation.py | 2 +- .../gosat_ch4_transformation.py | 36 +++++++++++++++++++ .../gpw_transformation.py | 2 +- ...h4flux_mask_monthgrid_v5_transformation.py | 2 +- 5 files changed, 40 insertions(+), 4 deletions(-) rename data_transformation_plugins/{ecco_darwin_tranformation.py => ecco_darwin_transformation.py} (97%) create mode 100644 data_transformation_plugins/gosat_ch4_transformation.py diff --git a/data_transformation_plugins/ecco_darwin_tranformation.py b/data_transformation_plugins/ecco_darwin_transformation.py similarity index 97% rename from data_transformation_plugins/ecco_darwin_tranformation.py rename to data_transformation_plugins/ecco_darwin_transformation.py index 90ac2da9..9696a372 100644 --- a/data_transformation_plugins/ecco_darwin_tranformation.py +++ b/data_transformation_plugins/ecco_darwin_transformation.py @@ -31,7 +31,7 @@ def ecco_darwin_transformation(file_obj, name, nodata): data = xds[var] data = data.reindex(latitude=list(reversed(data.latitude))) - data = data.where(data == nodata, -9999) + data = data.where(data != nodata, -9999) data.rio.set_spatial_dims("longitude", "latitude", inplace=True) data.rio.write_crs("epsg:4326", inplace=True) data.rio.write_nodata(-9999, inplace=True) diff --git a/data_transformation_plugins/geos_oco2_transformation.py b/data_transformation_plugins/geos_oco2_transformation.py index f647e33d..4165c91e 100644 --- a/data_transformation_plugins/geos_oco2_transformation.py +++ b/data_transformation_plugins/geos_oco2_transformation.py @@ -22,7 +22,7 @@ 
def geos_oco2_transformation(file_obj, name, nodata): filename_elements = re.split("[_ .]", filename) data = getattr(xds.isel(time=time_increment), var) data = data.isel(lat=slice(None, None, -1)) - data = data.where(data == nodata, -9999) + data = data.where(data != nodata, -9999) data.rio.set_spatial_dims("lon", "lat", inplace=True) data.rio.write_crs("epsg:4326", inplace=True) data.rio.write_nodata(-9999, inplace=True) diff --git a/data_transformation_plugins/gosat_ch4_transformation.py b/data_transformation_plugins/gosat_ch4_transformation.py new file mode 100644 index 00000000..a9adbb3e --- /dev/null +++ b/data_transformation_plugins/gosat_ch4_transformation.py @@ -0,0 +1,36 @@ +import xarray +import re + +def gosat_ch4_transformation(file_obj, name, nodata): + """Tranformation function for the ecco darwin dataset + + Args: + file_obj (s3fs object): s3fs sile object for one file of the dataset + name (str): name of the file to be transformed + nodata (int): Nodata value as specified by the data provider + + Returns: + dict: Dictionary with the COG name and its corresponding data array. + """ + var_data_netcdf = {} + ds = xarray.open_dataset(file_obj) + variable = [var for var in ds.data_vars] + + for var in variable: + filename = name.split("/")[-1] + filename_elements = re.split("[_ .]", filename) + data = ds[var] + filename_elements.pop() + filename_elements.insert(2, var) + cog_filename = "_".join(filename_elements) + # # add extension + cog_filename = f"{cog_filename}.tif" + + data = data.reindex(lat=list(reversed(data.lat))) + data = data.where(data != -9999, -9999) + data.rio.write_nodata(-9999, inplace=True) + + data.rio.set_spatial_dims("lon", "lat") + data.rio.write_crs("epsg:4326", inplace=True) + var_data_netcdf[cog_filename] = data + return var_data_netcdf \ No newline at end of file diff --git a/data_transformation_plugins/gpw_transformation.py b/data_transformation_plugins/gpw_transformation.py index 6f030623..5849f350 100644 --- a/data_transformation_plugins/gpw_transformation.py +++ b/data_transformation_plugins/gpw_transformation.py @@ -21,7 +21,7 @@ def gpw_transformation(file_obj, name, nodata): # # insert date of generated COG into filename filename_elements.pop() filename_elements.append(filename_elements[-3]) - xds = xds.where(xds == nodata, -9999) + xds = xds.where(xds != nodata, -9999) xds.rio.set_spatial_dims("x", "y", inplace=True) xds.rio.write_crs("epsg:4326", inplace=True) xds.rio.write_nodata(-9999, inplace=True) diff --git a/data_transformation_plugins/tm54dvar_ch4flux_mask_monthgrid_v5_transformation.py b/data_transformation_plugins/tm54dvar_ch4flux_mask_monthgrid_v5_transformation.py index 73168450..7565ec8a 100644 --- a/data_transformation_plugins/tm54dvar_ch4flux_mask_monthgrid_v5_transformation.py +++ b/data_transformation_plugins/tm54dvar_ch4flux_mask_monthgrid_v5_transformation.py @@ -27,7 +27,7 @@ def tm54dvar_ch4flux_mask_monthgrid_v5_transformation(file_obj, name, nodata): for var in variable: data = getattr(xds.isel(months=time_increment), var) data = data.isel(lat=slice(None, None, -1)) - data = data.where(data == nodata, -9999) + data = data.where(data != nodata, -9999) data.rio.set_spatial_dims("lon", "lat", inplace=True) data.rio.write_crs("epsg:4326", inplace=True) data.rio.write_nodata(-9999, inplace=True) From 5dcb6022793d942595f600a815f923e72698c448 Mon Sep 17 00:00:00 2001 From: vishal Date: Thu, 31 Oct 2024 09:12:06 -0500 Subject: [PATCH 08/13] resolved the comments --- .../ecco_darwin_transformation.py | 38 +++++++++---------- 
.../gosat_ch4_transformation.py | 1 + .../gpw_transformation.py | 1 + 3 files changed, 21 insertions(+), 19 deletions(-) diff --git a/data_transformation_plugins/ecco_darwin_transformation.py b/data_transformation_plugins/ecco_darwin_transformation.py index 9696a372..b31c2c13 100644 --- a/data_transformation_plugins/ecco_darwin_transformation.py +++ b/data_transformation_plugins/ecco_darwin_transformation.py @@ -22,26 +22,26 @@ def ecco_darwin_transformation(file_obj, name, nodata): "latitude" ) - variable = [var for var in xds.data_vars] + variables = list(xds.data_vars)[2:] - for _ in xds.time.values: - for var in variable[2:]: - filename = name.split("/")[-1] - filename_elements = re.split("[_ .]", filename) - data = xds[var] + for var in variables: + filename = name.split("/")[-1] + filename_elements = re.split("[_ .]", filename) + data = xds[var] - data = data.reindex(latitude=list(reversed(data.latitude))) - data = data.where(data != nodata, -9999) - data.rio.set_spatial_dims("longitude", "latitude", inplace=True) - data.rio.write_crs("epsg:4326", inplace=True) - data.rio.write_nodata(-9999, inplace=True) + data = data.reindex(latitude=list(reversed(data.latitude))) + data = data.where(data != nodata, -9999) + data.rio.set_spatial_dims("longitude", "latitude", inplace=True) + data.rio.write_crs("epsg:4326", inplace=True) + data.rio.write_nodata(-9999, inplace=True) - filename_elements.pop() - filename_elements[-1] = filename_elements[-2] + filename_elements[-1] - filename_elements.pop(-2) - # # insert date of generated COG into filename - cog_filename = "_".join(filename_elements) - # # add extension - cog_filename = f"{cog_filename}.tif" - var_data_netcdf[cog_filename] = data + filename_elements.pop() + filename_elements[-1] = filename_elements[-2] + filename_elements[-1] + filename_elements.pop(-2) + # # insert date of generated COG into filename + cog_filename = "_".join(filename_elements) + # # add extension + cog_filename = f"{cog_filename}.tif" + var_data_netcdf[cog_filename] = data + return var_data_netcdf \ No newline at end of file diff --git a/data_transformation_plugins/gosat_ch4_transformation.py b/data_transformation_plugins/gosat_ch4_transformation.py index a9adbb3e..7a88b85f 100644 --- a/data_transformation_plugins/gosat_ch4_transformation.py +++ b/data_transformation_plugins/gosat_ch4_transformation.py @@ -33,4 +33,5 @@ def gosat_ch4_transformation(file_obj, name, nodata): data.rio.set_spatial_dims("lon", "lat") data.rio.write_crs("epsg:4326", inplace=True) var_data_netcdf[cog_filename] = data + return var_data_netcdf \ No newline at end of file diff --git a/data_transformation_plugins/gpw_transformation.py b/data_transformation_plugins/gpw_transformation.py index 5849f350..fde5d1f7 100644 --- a/data_transformation_plugins/gpw_transformation.py +++ b/data_transformation_plugins/gpw_transformation.py @@ -30,4 +30,5 @@ def gpw_transformation(file_obj, name, nodata): # # add extension cog_filename = f"{cog_filename}.tif" var_data_netcdf[cog_filename] = xds + return var_data_netcdf \ No newline at end of file From 0b0870d7352d5364d73bc3fff70619dc6192e95e Mon Sep 17 00:00:00 2001 From: vishal Date: Fri, 1 Nov 2024 10:12:13 -0500 Subject: [PATCH 09/13] added a sample transformation notebook along with updating the README file --- data_transformation_plugins/README.md | 8 +- data_transformation_plugins/push_to_s3.py | 2 +- .../sample_transformation.ipynb | 102 ++++++++++++++++++ 3 files changed, 110 insertions(+), 2 deletions(-) create mode 100644 
data_transformation_plugins/sample_transformation.ipynb diff --git a/data_transformation_plugins/README.md b/data_transformation_plugins/README.md index 26524176..9160fa89 100644 --- a/data_transformation_plugins/README.md +++ b/data_transformation_plugins/README.md @@ -6,4 +6,10 @@ These functions/files are created by the `developer` to transform a single data ## Naming convention for the transformation files in the folder - `name of python file` - `collectionname_transformation.py` -`collectionname` refers to the STAC collection name of the dataset followed by the word `transformation`. Make sure the `collectionname` within the filename matches with the `collectionname` passed as a `parameter` to the DAG. \ No newline at end of file +`collectionname` refers to the STAC collection name of the dataset followed by the word `transformation`. Make sure the `collectionname` within the filename matches with the `collectionname` passed as a `parameter` to the DAG. + +## Steps for running the pipeline +- Test convert a single netCDF file for a new dataset using the `sample_transformation.ipynb` notebook. +- Create a new `data transformation plugin` python file for the new dataset using the convention mentioned above. +- `push_to_s3.py` is not yet plugged into the `CI/CD pipeline` so after creating the plugin, run the python file in the terminal. Running the python file will only push the files that are not present on the S3 folder. +- At this point, the tasks from `ghgc-docs` are completed. \ No newline at end of file diff --git a/data_transformation_plugins/push_to_s3.py b/data_transformation_plugins/push_to_s3.py index 85d52c22..7f941bc9 100644 --- a/data_transformation_plugins/push_to_s3.py +++ b/data_transformation_plugins/push_to_s3.py @@ -44,4 +44,4 @@ def upload_files_to_s3(folder_path, bucket_name, s3_folder, exclude_files): # Example usage: # upload_folder_to_s3("path/to/local/folder", "my-s3-bucket", "my/s3/folder", ["exclude1.ext", "exclude2.ext"]) if __name__ == "__main__": - upload_files_to_s3("data_transformation_plugins", "ghgc-data-store-develop", "data_transformation_plugins", ["__init__.py", "push_to_s3.py", "README.md"]) \ No newline at end of file + upload_files_to_s3("data_transformation_plugins", "ghgc-data-store-develop", "data_transformation_plugins", ["__init__.py", "push_to_s3.py", "README.md", "sample_transformation.ipynb"]) \ No newline at end of file diff --git a/data_transformation_plugins/sample_transformation.ipynb b/data_transformation_plugins/sample_transformation.ipynb new file mode 100644 index 00000000..1f98a392 --- /dev/null +++ b/data_transformation_plugins/sample_transformation.ipynb @@ -0,0 +1,102 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Instructions on how to transform a single file\n", + "Install the required libraries in an isolated environment" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "import xarray\n", + "import re\n", + "from datetime import datetime" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "# Read a file of the new dataset\n", + "name = 'test.nc'\n", + "ds = xarray.open_dataset(name) # open the file\n", + "print('The netcdf file contains information as shown below')\n", + "ds" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "# Explore the netCDF file\n", + "print('Data valriables in the netCDF 
file are', ds.data_vars)\n", + "print('Dimensions mentioned in the netCDF file are', ds.dims)\n", + "#..... explore the netCDf file for more information" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "# once explored, look at the latitude, longitude and other values and comvert them if needed.\n", + "ds = ds.rename({\"latitude\": \"lat\", \"longitude\": \"lon\"})\n", + "ds = ds.assign_coords(lon=(((ds.lon + 180) % 360) - 180)).sortby(\"lon\")\n", + "variable = [var for var in ds.data_vars]" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "# Parse through the time variable to extract single timestamp and create a dataarray for the given timestamp.\n", + "for time_increment in range(0, len(ds.months)):\n", + " # split the original file name to create a unique COG name\n", + " filename = name.split(\"/ \")[-1]\n", + " filename_elements = re.split(\"[_ .]\", filename)\n", + " start_time = datetime(int(filename_elements[-2]), time_increment + 1, 1)\n", + " for var in variable: # Parse through the data variables\n", + " data = getattr(ds.isel(months=time_increment), var)\n", + " data = data.isel(lat=slice(None, None, -1))\n", + " data.rio.set_spatial_dims(\"lon\", \"lat\", inplace=True)\n", + " data.rio.write_crs(\"epsg:4326\", inplace=True)\n", + "\n", + " # # insert date of generated COG into filename\n", + " filename_elements.pop()\n", + " filename_elements[-1] = start_time.strftime(\"%Y%m\")\n", + " filename_elements.insert(2, var)\n", + " cog_filename = \"_\".join(filename_elements)\n", + " # # add extension\n", + " cog_filename = f\"{cog_filename}.tif\"" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Validate the COG using QGIS or any other means.\n", + "Once validated, follow the steps mentioned in the README in the folder `data_transformation_plugins`" + ] + } + ], + "metadata": { + "language_info": { + "name": "python" + } + }, + "nbformat": 4, + "nbformat_minor": 2 +} From dcb3db1364c6e1e2ac79d337546986419bfbca50 Mon Sep 17 00:00:00 2001 From: vishal Date: Mon, 11 Nov 2024 14:37:44 -0600 Subject: [PATCH 10/13] tm5 new data transformation plugin --- ...hgrid_v5_transformation.py => tm54dvar_noaa_transformation.py} | 0 1 file changed, 0 insertions(+), 0 deletions(-) rename data_transformation_plugins/{tm54dvar_ch4flux_mask_monthgrid_v5_transformation.py => tm54dvar_noaa_transformation.py} (100%) diff --git a/data_transformation_plugins/tm54dvar_ch4flux_mask_monthgrid_v5_transformation.py b/data_transformation_plugins/tm54dvar_noaa_transformation.py similarity index 100% rename from data_transformation_plugins/tm54dvar_ch4flux_mask_monthgrid_v5_transformation.py rename to data_transformation_plugins/tm54dvar_noaa_transformation.py From d94aed272bc59788b8cf59e9e79aaa57223e72fd Mon Sep 17 00:00:00 2001 From: vishal Date: Mon, 11 Nov 2024 15:18:29 -0600 Subject: [PATCH 11/13] updated the tm5 transformation script --- .../sample_transformation.ipynb | 595 +++++++++++++++++- ...> tm5_4dvar_update_noaa_transformation.py} | 4 +- 2 files changed, 590 insertions(+), 9 deletions(-) rename data_transformation_plugins/{tm54dvar_noaa_transformation.py => tm5_4dvar_update_noaa_transformation.py} (91%) diff --git a/data_transformation_plugins/sample_transformation.ipynb b/data_transformation_plugins/sample_transformation.ipynb index 1f98a392..44dd8c02 100644 --- a/data_transformation_plugins/sample_transformation.ipynb +++ 
b/data_transformation_plugins/sample_transformation.ipynb @@ -10,7 +10,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 1, "metadata": {}, "outputs": [], "source": [ @@ -21,12 +21,461 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 3, "metadata": {}, - "outputs": [], + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "The netcdf file contains information as shown below\n" + ] + }, + { + "data": { + "text/html": [ + "
+       "&lt;xarray.Dataset&gt;\n",
+       "Dimensions:               (latitude: 180, longitude: 360, months: 12)\n",
+       "Coordinates:\n",
+       "  * latitude              (latitude) float64 -89.5 -88.5 -87.5 ... 88.5 89.5\n",
+       "  * longitude             (longitude) float64 -179.5 -178.5 ... 178.5 179.5\n",
+       "  * months                (months) int32 1 2 3 4 5 6 7 8 9 10 11 12\n",
+       "Data variables:\n",
+       "    fossil                (months, latitude, longitude) float64 ...\n",
+       "    fossil_global_sum     (months) float64 ...\n",
+       "    microbial             (months, latitude, longitude) float64 ...\n",
+       "    microbial_global_sum  (months) float64 ...\n",
+       "    pyrogenic             (months, latitude, longitude) float64 ...\n",
+       "    pyrogenic_global_sum  (months) float64 ...\n",
+       "    total                 (months, latitude, longitude) float64 ...\n",
+       "    total_global_sum      (months) float64 ...\n",
+       "    surface_area          (latitude, longitude) float64 ...\n",
+       "Attributes:\n",
+       "    email:        carbontracker.team@noaa.gov\n",
+       "    url:          http://gml.noaa.gov/ccgg/carbontracker-ch4/\n",
+       "    institution:  NOAA Global Monitoring Laboratory\n",
+       "    version:      CTCH4 v2023 1x1 monthly fluxes as of 08-Nov-2024 01:58:47 UTC
" + ], + "text/plain": [ + "\n", + "Dimensions: (latitude: 180, longitude: 360, months: 12)\n", + "Coordinates:\n", + " * latitude (latitude) float64 -89.5 -88.5 -87.5 ... 88.5 89.5\n", + " * longitude (longitude) float64 -179.5 -178.5 ... 178.5 179.5\n", + " * months (months) int32 1 2 3 4 5 6 7 8 9 10 11 12\n", + "Data variables:\n", + " fossil (months, latitude, longitude) float64 ...\n", + " fossil_global_sum (months) float64 ...\n", + " microbial (months, latitude, longitude) float64 ...\n", + " microbial_global_sum (months) float64 ...\n", + " pyrogenic (months, latitude, longitude) float64 ...\n", + " pyrogenic_global_sum (months) float64 ...\n", + " total (months, latitude, longitude) float64 ...\n", + " total_global_sum (months) float64 ...\n", + " surface_area (latitude, longitude) float64 ...\n", + "Attributes:\n", + " email: carbontracker.team@noaa.gov\n", + " url: http://gml.noaa.gov/ccgg/carbontracker-ch4/\n", + " institution: NOAA Global Monitoring Laboratory\n", + " version: CTCH4 v2023 1x1 monthly fluxes as of 08-Nov-2024 01:58:47 UTC" + ] + }, + "execution_count": 3, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "# Read a file of the new dataset\n", - "name = 'test.nc'\n", + "name = '/Users/vgaur/Downloads/CTCH4_methane_emis_1998.nc'\n", "ds = xarray.open_dataset(name) # open the file\n", "print('The netcdf file contains information as shown below')\n", "ds" @@ -34,9 +483,27 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 4, "metadata": {}, - "outputs": [], + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Data valriables in the netCDF file are Data variables:\n", + " fossil (months, latitude, longitude) float64 ...\n", + " fossil_global_sum (months) float64 ...\n", + " microbial (months, latitude, longitude) float64 ...\n", + " microbial_global_sum (months) float64 ...\n", + " pyrogenic (months, latitude, longitude) float64 ...\n", + " pyrogenic_global_sum (months) float64 ...\n", + " total (months, latitude, longitude) float64 ...\n", + " total_global_sum (months) float64 ...\n", + " surface_area (latitude, longitude) float64 ...\n", + "Dimensions mentioned in the netCDF file are Frozen({'latitude': 180, 'longitude': 360, 'months': 12})\n" + ] + } + ], "source": [ "# Explore the netCDF file\n", "print('Data valriables in the netCDF file are', ds.data_vars)\n", @@ -46,7 +513,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 5, "metadata": {}, "outputs": [], "source": [ @@ -83,6 +550,104 @@ " cog_filename = f\"{cog_filename}.tif\"" ] }, + { + "cell_type": "code", + "execution_count": 9, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "CTCH4_methane_fossil_emis_199801.tif\n", + "CTCH4_methane_microbial_emis_199801.tif\n", + "CTCH4_methane_pyrogenic_emis_199801.tif\n", + "CTCH4_methane_total_emis_199801.tif\n", + "CTCH4_methane_surface_area_emis_199801.tif\n", + "CTCH4_methane_fossil_emis_199802.tif\n", + "CTCH4_methane_microbial_emis_199802.tif\n", + "CTCH4_methane_pyrogenic_emis_199802.tif\n", + "CTCH4_methane_total_emis_199802.tif\n", + "CTCH4_methane_surface_area_emis_199802.tif\n", + "CTCH4_methane_fossil_emis_199803.tif\n", + "CTCH4_methane_microbial_emis_199803.tif\n", + "CTCH4_methane_pyrogenic_emis_199803.tif\n", + "CTCH4_methane_total_emis_199803.tif\n", + "CTCH4_methane_surface_area_emis_199803.tif\n", + "CTCH4_methane_fossil_emis_199804.tif\n", + "CTCH4_methane_microbial_emis_199804.tif\n", + 
"CTCH4_methane_pyrogenic_emis_199804.tif\n", + "CTCH4_methane_total_emis_199804.tif\n", + "CTCH4_methane_surface_area_emis_199804.tif\n", + "CTCH4_methane_fossil_emis_199805.tif\n", + "CTCH4_methane_microbial_emis_199805.tif\n", + "CTCH4_methane_pyrogenic_emis_199805.tif\n", + "CTCH4_methane_total_emis_199805.tif\n", + "CTCH4_methane_surface_area_emis_199805.tif\n", + "CTCH4_methane_fossil_emis_199806.tif\n", + "CTCH4_methane_microbial_emis_199806.tif\n", + "CTCH4_methane_pyrogenic_emis_199806.tif\n", + "CTCH4_methane_total_emis_199806.tif\n", + "CTCH4_methane_surface_area_emis_199806.tif\n", + "CTCH4_methane_fossil_emis_199807.tif\n", + "CTCH4_methane_microbial_emis_199807.tif\n", + "CTCH4_methane_pyrogenic_emis_199807.tif\n", + "CTCH4_methane_total_emis_199807.tif\n", + "CTCH4_methane_surface_area_emis_199807.tif\n", + "CTCH4_methane_fossil_emis_199808.tif\n", + "CTCH4_methane_microbial_emis_199808.tif\n", + "CTCH4_methane_pyrogenic_emis_199808.tif\n", + "CTCH4_methane_total_emis_199808.tif\n", + "CTCH4_methane_surface_area_emis_199808.tif\n", + "CTCH4_methane_fossil_emis_199809.tif\n", + "CTCH4_methane_microbial_emis_199809.tif\n", + "CTCH4_methane_pyrogenic_emis_199809.tif\n", + "CTCH4_methane_total_emis_199809.tif\n", + "CTCH4_methane_surface_area_emis_199809.tif\n", + "CTCH4_methane_fossil_emis_199810.tif\n", + "CTCH4_methane_microbial_emis_199810.tif\n", + "CTCH4_methane_pyrogenic_emis_199810.tif\n", + "CTCH4_methane_total_emis_199810.tif\n", + "CTCH4_methane_surface_area_emis_199810.tif\n", + "CTCH4_methane_fossil_emis_199811.tif\n", + "CTCH4_methane_microbial_emis_199811.tif\n", + "CTCH4_methane_pyrogenic_emis_199811.tif\n", + "CTCH4_methane_total_emis_199811.tif\n", + "CTCH4_methane_surface_area_emis_199811.tif\n", + "CTCH4_methane_fossil_emis_199812.tif\n", + "CTCH4_methane_microbial_emis_199812.tif\n", + "CTCH4_methane_pyrogenic_emis_199812.tif\n", + "CTCH4_methane_total_emis_199812.tif\n", + "CTCH4_methane_surface_area_emis_199812.tif\n" + ] + } + ], + "source": [ + "variable = [var for var in ds.data_vars if \"global\" not in var]\n", + "\n", + "for time_increment in range(0, len(ds.months)):\n", + " filename = name.split(\"/\")[-1]\n", + " filename_elements = re.split(\"[_ .]\", filename)\n", + " start_time = datetime(int(filename_elements[-2]), time_increment + 1, 1)\n", + " for var in variable:\n", + " filename = name.split(\"/\")[-1]\n", + " filename_elements = re.split(\"[_ .]\", filename)\n", + " data = getattr(ds.isel(months=time_increment), var)\n", + " data = data.isel(lat=slice(None, None, -1))\n", + " data = data.where(data != -9999, -9999)\n", + " data.rio.set_spatial_dims(\"lon\", \"lat\", inplace=True)\n", + " data.rio.write_crs(\"epsg:4326\", inplace=True)\n", + " data.rio.write_nodata(-9999, inplace=True)\n", + "\n", + " # # insert date of generated COG into filename\n", + " filename_elements.pop()\n", + " filename_elements[-1] = start_time.strftime(\"%Y%m\")\n", + " filename_elements.insert(2, var)\n", + " cog_filename = \"_\".join(filename_elements)\n", + " # # add extension\n", + " cog_filename = f\"{cog_filename}.tif\"" + ] + }, { "cell_type": "markdown", "metadata": {}, @@ -93,8 +658,22 @@ } ], "metadata": { + "kernelspec": { + "display_name": "cmip6", + "language": "python", + "name": "python3" + }, "language_info": { - "name": "python" + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": 
"3.9.16" } }, "nbformat": 4, diff --git a/data_transformation_plugins/tm54dvar_noaa_transformation.py b/data_transformation_plugins/tm5_4dvar_update_noaa_transformation.py similarity index 91% rename from data_transformation_plugins/tm54dvar_noaa_transformation.py rename to data_transformation_plugins/tm5_4dvar_update_noaa_transformation.py index 7565ec8a..1fd491b3 100644 --- a/data_transformation_plugins/tm54dvar_noaa_transformation.py +++ b/data_transformation_plugins/tm5_4dvar_update_noaa_transformation.py @@ -2,7 +2,7 @@ from datetime import datetime import re -def tm54dvar_ch4flux_mask_monthgrid_v5_transformation(file_obj, name, nodata): +def tm5_4dvar_update_noaa_transformation(file_obj, name, nodata): """Tranformation function for the tm5 ch4 influx dataset Args: @@ -25,6 +25,8 @@ def tm54dvar_ch4flux_mask_monthgrid_v5_transformation(file_obj, name, nodata): filename_elements = re.split("[_ .]", filename) start_time = datetime(int(filename_elements[-2]), time_increment + 1, 1) for var in variable: + filename = name.split("/")[-1] + filename_elements = re.split("[_ .]", filename) data = getattr(xds.isel(months=time_increment), var) data = data.isel(lat=slice(None, None, -1)) data = data.where(data != nodata, -9999) From e6a6ee9ae51d820b30f71da91fdd13252568ff87 Mon Sep 17 00:00:00 2001 From: vishal Date: Tue, 19 Nov 2024 11:11:45 -0600 Subject: [PATCH 12/13] reformatting files --- .../ecco_darwin_transformation.py | 14 ++++++----- .../geos_oco2_transformation.py | 6 +++-- .../gosat_ch4_transformation.py | 8 ++++--- .../gpw_transformation.py | 8 ++++--- data_transformation_plugins/push_to_s3.py | 24 +++++++++++++------ .../tm5_4dvar_update_noaa_transformation.py | 8 ++++--- 6 files changed, 44 insertions(+), 24 deletions(-) diff --git a/data_transformation_plugins/ecco_darwin_transformation.py b/data_transformation_plugins/ecco_darwin_transformation.py index b31c2c13..93be21cd 100644 --- a/data_transformation_plugins/ecco_darwin_transformation.py +++ b/data_transformation_plugins/ecco_darwin_transformation.py @@ -1,6 +1,8 @@ -import xarray import re +import xarray + + def ecco_darwin_transformation(file_obj, name, nodata): """Tranformation function for the ecco darwin dataset @@ -15,9 +17,9 @@ def ecco_darwin_transformation(file_obj, name, nodata): var_data_netcdf = {} xds = xarray.open_dataset(file_obj) xds = xds.rename({"y": "latitude", "x": "longitude"}) - xds = xds.assign_coords(longitude=((xds.longitude / 1440) * 360) - 180).sortby( - "longitude" - ) + xds = xds.assign_coords( + longitude=((xds.longitude / 1440) * 360) - 180 + ).sortby("longitude") xds = xds.assign_coords(latitude=((xds.latitude / 721) * 180) - 90).sortby( "latitude" ) @@ -43,5 +45,5 @@ def ecco_darwin_transformation(file_obj, name, nodata): # # add extension cog_filename = f"{cog_filename}.tif" var_data_netcdf[cog_filename] = data - - return var_data_netcdf \ No newline at end of file + + return var_data_netcdf diff --git a/data_transformation_plugins/geos_oco2_transformation.py b/data_transformation_plugins/geos_oco2_transformation.py index 4165c91e..61b9702a 100644 --- a/data_transformation_plugins/geos_oco2_transformation.py +++ b/data_transformation_plugins/geos_oco2_transformation.py @@ -1,6 +1,8 @@ -import xarray import re +import xarray + + def geos_oco2_transformation(file_obj, name, nodata): """Tranformation function for the oco2 geos dataset @@ -35,4 +37,4 @@ def geos_oco2_transformation(file_obj, name, nodata): cog_filename = f"{cog_filename}.tif" var_data_netcdf[cog_filename] = data - return 
var_data_netcdf \ No newline at end of file + return var_data_netcdf diff --git a/data_transformation_plugins/gosat_ch4_transformation.py b/data_transformation_plugins/gosat_ch4_transformation.py index 7a88b85f..ea5552ec 100644 --- a/data_transformation_plugins/gosat_ch4_transformation.py +++ b/data_transformation_plugins/gosat_ch4_transformation.py @@ -1,6 +1,8 @@ -import xarray import re +import xarray + + def gosat_ch4_transformation(file_obj, name, nodata): """Tranformation function for the ecco darwin dataset @@ -33,5 +35,5 @@ def gosat_ch4_transformation(file_obj, name, nodata): data.rio.set_spatial_dims("lon", "lat") data.rio.write_crs("epsg:4326", inplace=True) var_data_netcdf[cog_filename] = data - - return var_data_netcdf \ No newline at end of file + + return var_data_netcdf diff --git a/data_transformation_plugins/gpw_transformation.py b/data_transformation_plugins/gpw_transformation.py index fde5d1f7..fb1e99d8 100644 --- a/data_transformation_plugins/gpw_transformation.py +++ b/data_transformation_plugins/gpw_transformation.py @@ -1,6 +1,8 @@ -import xarray import re +import xarray + + def gpw_transformation(file_obj, name, nodata): """Tranformation function for the gridded population dataset @@ -30,5 +32,5 @@ def gpw_transformation(file_obj, name, nodata): # # add extension cog_filename = f"{cog_filename}.tif" var_data_netcdf[cog_filename] = xds - - return var_data_netcdf \ No newline at end of file + + return var_data_netcdf diff --git a/data_transformation_plugins/push_to_s3.py b/data_transformation_plugins/push_to_s3.py index 7f941bc9..03cdfaa6 100644 --- a/data_transformation_plugins/push_to_s3.py +++ b/data_transformation_plugins/push_to_s3.py @@ -1,8 +1,7 @@ -import boto3 import os import boto3 -import os + def upload_files_to_s3(folder_path, bucket_name, s3_folder, exclude_files): """ @@ -16,23 +15,23 @@ def upload_files_to_s3(folder_path, bucket_name, s3_folder, exclude_files): - exclude_files (list): List of files to exclude from uploading. 
""" # Initialize S3 client - s3 = boto3.client('s3') + s3 = boto3.client("s3") # Loop through files in the local folder for file_name in os.listdir(folder_path): file_path = os.path.join(folder_path, file_name) - + # Check if it's a file and not in the exclude list if os.path.isfile(file_path) and file_name not in exclude_files: s3_key = os.path.join(s3_folder, file_name) - + try: # Check if the file already exists in S3 s3.head_object(Bucket=bucket_name, Key=s3_key) print(f"Skipped {file_name} (already exists in S3)") except s3.exceptions.ClientError as e: # If the file does not exist, upload it - if e.response['Error']['Code'] == '404': + if e.response["Error"]["Code"] == "404": try: s3.upload_file(file_path, bucket_name, s3_key) print(f"Uploaded {file_name} to {s3_key}") @@ -41,7 +40,18 @@ def upload_files_to_s3(folder_path, bucket_name, s3_folder, exclude_files): else: print(f"Error checking existence of {file_name}: {e}") + # Example usage: # upload_folder_to_s3("path/to/local/folder", "my-s3-bucket", "my/s3/folder", ["exclude1.ext", "exclude2.ext"]) if __name__ == "__main__": - upload_files_to_s3("data_transformation_plugins", "ghgc-data-store-develop", "data_transformation_plugins", ["__init__.py", "push_to_s3.py", "README.md", "sample_transformation.ipynb"]) \ No newline at end of file + upload_files_to_s3( + "data_transformation_plugins", + "ghgc-data-store-develop", + "data_transformation_plugins", + [ + "__init__.py", + "push_to_s3.py", + "README.md", + "sample_transformation.ipynb", + ], + ) diff --git a/data_transformation_plugins/tm5_4dvar_update_noaa_transformation.py b/data_transformation_plugins/tm5_4dvar_update_noaa_transformation.py index 1fd491b3..a7f3a8ac 100644 --- a/data_transformation_plugins/tm5_4dvar_update_noaa_transformation.py +++ b/data_transformation_plugins/tm5_4dvar_update_noaa_transformation.py @@ -1,6 +1,8 @@ -import xarray -from datetime import datetime import re +from datetime import datetime + +import xarray + def tm5_4dvar_update_noaa_transformation(file_obj, name, nodata): """Tranformation function for the tm5 ch4 influx dataset @@ -43,4 +45,4 @@ def tm5_4dvar_update_noaa_transformation(file_obj, name, nodata): cog_filename = f"{cog_filename}.tif" var_data_netcdf[cog_filename] = data - return var_data_netcdf \ No newline at end of file + return var_data_netcdf From 6c85d0ca6bd56e2d6028476358942da33bb4bc00 Mon Sep 17 00:00:00 2001 From: vishal Date: Wed, 20 Nov 2024 10:01:32 -0600 Subject: [PATCH 13/13] reformatting files along with resolving the comments --- .../ecco_darwin_transformation.py | 9 +++++++-- .../geos_oco2_transformation.py | 9 +++++++-- .../gosat_ch4_transformation.py | 11 ++++++++--- data_transformation_plugins/gpw_transformation.py | 9 +++++++-- .../tm5_4dvar_update_noaa_transformation.py | 9 +++++++-- 5 files changed, 36 insertions(+), 11 deletions(-) diff --git a/data_transformation_plugins/ecco_darwin_transformation.py b/data_transformation_plugins/ecco_darwin_transformation.py index 93be21cd..9eb518b0 100644 --- a/data_transformation_plugins/ecco_darwin_transformation.py +++ b/data_transformation_plugins/ecco_darwin_transformation.py @@ -1,10 +1,15 @@ import re +from typing import Dict import xarray +from s3fs import S3File +from xarray import DataArray -def ecco_darwin_transformation(file_obj, name, nodata): - """Tranformation function for the ecco darwin dataset +def ecco_darwin_transformation( + file_obj: S3File, name: str, nodata: int +) -> Dict[str, DataArray]: + """Transformation function for the ecco darwin dataset Args: 
file_obj (s3fs object): s3fs sile object for one file of the dataset diff --git a/data_transformation_plugins/geos_oco2_transformation.py b/data_transformation_plugins/geos_oco2_transformation.py index 61b9702a..dc18dfbc 100644 --- a/data_transformation_plugins/geos_oco2_transformation.py +++ b/data_transformation_plugins/geos_oco2_transformation.py @@ -1,10 +1,15 @@ import re +from typing import Dict import xarray +from s3fs import S3File +from xarray import DataArray -def geos_oco2_transformation(file_obj, name, nodata): - """Tranformation function for the oco2 geos dataset +def geos_oco2_transformation( + file_obj: S3File, name: str, nodata: int +) -> Dict[str, DataArray]: + """Transformation function for the oco2 geos dataset Args: file_obj (s3fs object): s3fs sile object for one file of the dataset diff --git a/data_transformation_plugins/gosat_ch4_transformation.py b/data_transformation_plugins/gosat_ch4_transformation.py index ea5552ec..ac299264 100644 --- a/data_transformation_plugins/gosat_ch4_transformation.py +++ b/data_transformation_plugins/gosat_ch4_transformation.py @@ -1,10 +1,15 @@ import re +from typing import Dict import xarray +from s3fs import S3File +from xarray import DataArray -def gosat_ch4_transformation(file_obj, name, nodata): - """Tranformation function for the ecco darwin dataset +def gosat_ch4_transformation( + file_obj: S3File, name: str, nodata: int +) -> Dict[str, DataArray]: + """Transformation function for the ecco darwin dataset Args: file_obj (s3fs object): s3fs sile object for one file of the dataset @@ -29,7 +34,7 @@ def gosat_ch4_transformation(file_obj, name, nodata): cog_filename = f"{cog_filename}.tif" data = data.reindex(lat=list(reversed(data.lat))) - data = data.where(data != -9999, -9999) + data = data.where(data != nodata, -9999) data.rio.write_nodata(-9999, inplace=True) data.rio.set_spatial_dims("lon", "lat") diff --git a/data_transformation_plugins/gpw_transformation.py b/data_transformation_plugins/gpw_transformation.py index fb1e99d8..9db17e90 100644 --- a/data_transformation_plugins/gpw_transformation.py +++ b/data_transformation_plugins/gpw_transformation.py @@ -1,10 +1,15 @@ import re +from typing import Dict import xarray +from s3fs import S3File +from xarray import DataArray -def gpw_transformation(file_obj, name, nodata): - """Tranformation function for the gridded population dataset +def gpw_transformation( + file_obj: S3File, name: str, nodata: int +) -> Dict[str, DataArray]: + """Transformation function for the gridded population dataset Args: file_obj (s3fs object): s3fs sile object for one file of the dataset diff --git a/data_transformation_plugins/tm5_4dvar_update_noaa_transformation.py b/data_transformation_plugins/tm5_4dvar_update_noaa_transformation.py index a7f3a8ac..8b13fc79 100644 --- a/data_transformation_plugins/tm5_4dvar_update_noaa_transformation.py +++ b/data_transformation_plugins/tm5_4dvar_update_noaa_transformation.py @@ -1,11 +1,16 @@ import re from datetime import datetime +from typing import Dict import xarray +from s3fs import S3File +from xarray import DataArray -def tm5_4dvar_update_noaa_transformation(file_obj, name, nodata): - """Tranformation function for the tm5 ch4 influx dataset +def tm5_4dvar_update_noaa_transformation( + file_obj: S3File, name: str, nodata: int +) -> Dict[str, DataArray]: + """Transformation function for the tm5 ch4 influx dataset Args: file_obj (s3fs object): s3fs sile object for one file of the dataset
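Note: all of the plugins above follow the `collectionname_transformation`
naming convention from the README. A hypothetical sketch of how a DAG task
could resolve a plugin by collection name is shown below; the actual SM2A
lookup logic is not part of these patches and may differ.

```python
# Hypothetical plugin lookup by collection name; not the actual SM2A DAG code.
import importlib
from typing import Callable


def resolve_plugin(collection_name: str) -> Callable:
    """Import data_transformation_plugins.<collection_name>_transformation and
    return the function of the same name defined in that module."""
    module = importlib.import_module(
        f"data_transformation_plugins.{collection_name}_transformation"
    )
    return getattr(module, f"{collection_name}_transformation")


transform = resolve_plugin("gpw")
# transform(file_obj, name, nodata) -> Dict[str, DataArray]
```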