diff --git a/.devcontainer/devcontainer.json b/.devcontainer/devcontainer.json new file mode 100644 index 00000000..5ca24e93 --- /dev/null +++ b/.devcontainer/devcontainer.json @@ -0,0 +1,16 @@ +{ + "name": "frdc", + "build": { + "dockerfile": "../Dockerfile", + }, + "containerEnv": { + "LABEL_STUDIO_HOST": "host.docker.internal", + "LABEL_STUDIO_API_KEY": "${localEnv:LABEL_STUDIO_API_KEY}", + }, + "runArgs": [ + "--gpus=all", + ], + "hostRequirements": { + "gpu": true, + } +} \ No newline at end of file diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 00000000..d28cb2fc --- /dev/null +++ b/.gitattributes @@ -0,0 +1 @@ +Dockerfile text=auto eol=lf \ No newline at end of file diff --git a/Dockerfile b/Dockerfile new file mode 100644 index 00000000..526daecb --- /dev/null +++ b/Dockerfile @@ -0,0 +1,20 @@ +FROM pytorch/pytorch:2.1.2-cuda12.1-cudnn8-runtime as torch +WORKDIR /devcontainer + +COPY ./pyproject.toml /devcontainer/pyproject.toml + +RUN apt update -y && apt upgrade -y +RUN apt install git -y + +RUN pip3 install --upgrade pip && \ + pip3 install poetry && \ + pip3 install lightning + +RUN conda init bash \ + && . ~/.bashrc \ + && conda activate base \ + && poetry config virtualenvs.create false \ + && poetry install --with dev --no-interaction --no-ansi + +RUN apt install curl -y && curl -sSL https://sdk.cloud.google.com | bash +ENV PATH $PATH:/root/google-cloud-sdk/bin diff --git a/README.md b/README.md index 9ddd6c92..d497d13a 100644 --- a/README.md +++ b/README.md @@ -54,14 +54,6 @@ To illustrate this, take a look at how `tests/model_tests/chestnut_dec_may/train.py` is written. It pulls in relevant modules from each stage and constructs a pipeline. - -> Initially, we evaluated a few ML E2E solutions, despite them offering great -> functionality, their flexibility was -> limited. From a dev perspective, **Active Learning** was a gray area, and we -> foresee heavy shoehorning. -> Ultimately, we decided that the risk was too great, thus we resort to -> creating our own solution. - ## Contributing ### Pre-commit Hooks @@ -80,3 +72,5 @@ If you're using `pip` instead of `poetry`, run the following commands: pip install pre-commit pre-commit install ``` + +Alternatively, you can use Black configured with your own IDE. diff --git a/Writerside/d.tree b/Writerside/d.tree index 27fe88b4..32778cf1 100644 --- a/Writerside/d.tree +++ b/Writerside/d.tree @@ -8,7 +8,9 @@ start-page="Overview.md"> - + + + diff --git a/Writerside/topics/Get-Started-with-Dev-Containers.md b/Writerside/topics/Get-Started-with-Dev-Containers.md new file mode 100644 index 00000000..750bead5 --- /dev/null +++ b/Writerside/topics/Get-Started-with-Dev-Containers.md @@ -0,0 +1,49 @@ +# Get Started with Dev Containers + +Dev. Containers are a great way to get started with a project. They define all +necessary dependencies and environments, so you can just start coding within +the container. + +In this article, we'll only go over **additional steps** to set up with our +project. For more information on how to use Dev Containers, please refer to +the official documentation for each IDE. Once you've set up the Dev Container, +come back here to finish the setup: + +- [VSCode](https://code.visualstudio.com/docs/remote/containers). +- [IntelliJ](https://www.jetbrains.com/help/idea/connect-to-devcontainer.html) + +> If you see the error `Error response from daemon: ... the `.git` at the end of the repo URL. 
+{style='warning'} + +## Python Environment + +> Do not create a new environment +{style='warning'} + +The dev environment is already created and is managed by Anaconda +`/opt/conda/bin/conda`. +To activate the environment, run the following command: + +```bash +conda activate base +``` + +> Refer to your respective IDE's documentation on how to activate the +> environment. + +## Mark as Sources Root (Add to PYTHONPATH) + +For `import` statements to work, you need to mark the `src` folder as the +sources root. Optionally, also mark the `tests` folder as the tests root. + +> Refer to your respective IDE's documentation on how to mark folders as +> sources root. (Also known as adding to the `PYTHONPATH`) + +## Additional Setup + +Refer to the [Getting Started](Getting-Started.md) guide for additional setup +steps such as: +- Google Cloud Application Default Credentials +- Weight & Bias API Key +- Label Studio API Key diff --git a/Writerside/topics/Getting-Started.md b/Writerside/topics/Getting-Started.md index 7615174d..c62ee26f 100644 --- a/Writerside/topics/Getting-Started.md +++ b/Writerside/topics/Getting-Started.md @@ -1,5 +1,7 @@ # Getting Started +> Want to use a Dev Container? See [Get Started with Dev Containers](Get-Started-with-Dev-Containers.md) + Ensure that you have the right version of Python. The required Python version can be seen in pyproject.toml @@ -10,7 +12,7 @@ Start by cloning our repository. - git clone https://github.com/Forest-Recovery-Digital-Companion/FRDC-ML.git + git clone https://github.com/FR-DC/FRDC-ML.git Then, create a Python Virtual Env pyvenv @@ -60,6 +62,7 @@ + We use Google Cloud to store our datasets. To set up Google Cloud, @@ -86,6 +89,48 @@ + + This is only necessary if any task requires Label Studio annotations + + We use Label Studio to annotate our datasets. + We won't go through how to install Label Studio, for contributors, it + should be up on localhost:8080. + + + Then, retrieve your own API key from Label Studio. + Go to your account page + and copy the API key.
+ Set your API key as an environment variable. + + + In Windows, go to "Edit environment variables for + your account" and add this as a new environment variable with name + LABEL_STUDIO_API_KEY. + + + Export it as an environment variable. + export LABEL_STUDIO_API_KEY=... + + + +
+ + + + We use W&B to track our experiments. To set up W&B, + + install the W&B CLI + + + + Then, + + authenticate your account + . + wandb login + + + This is optional but recommended. Pre-commit hooks are a way to ensure that your code is formatted correctly. @@ -98,30 +143,45 @@ - + Run the tests to make sure everything is working pytest - - In case of errors: - - - If you get this error, it means that you haven't authenticated your - Google Cloud account. - See Setting Up Google Cloud - - - If you get this error, it means that you haven't installed the - dependencies. - See Installing the Dev. Environment - - - +## Troubleshooting + +### ModuleNotFoundError + +It's likely that your `src` and `tests` directories are not in `PYTHONPATH`. +To fix this, run the following command: + +```shell +export PYTHONPATH=$PYTHONPATH:./src:./tests +``` + +Or, set it in your IDE, for example, IntelliJ allows setting directories as +**Source Roots**. + +### google.auth.exceptions.DefaultCredentialsError + +It's likely that you haven't authenticated your Google Cloud account. +See [Setting Up Google Cloud](#gcloud) + +### Couldn't connect to Label Studio + +Label Studio must be running locally, exposed on `localhost:8080`. Furthermore, +you need to specify the `LABEL_STUDIO_API_KEY` environment variable. See +[Setting Up Label Studio](#ls) + +### Cannot login to W&B + +You need to authenticate your W&B account. See [Setting Up Weight and Biases](#wandb) +If you're facing difficulties, set the `WANDB_MODE` environment variable to `offline` +to disable W&B. ## Our Repository Structure @@ -132,7 +192,6 @@ help you understand where to put your code. graph LR FRDC -- " Core Dependencies " --> src/frdc/ FRDC -- " Resources " --> rsc/ - FRDC -- " Pipeline " --> pipeline/ FRDC -- " Tests " --> tests/ FRDC -- " Repo Dependencies " --> pyproject.toml,poetry.lock src/frdc/ -- " Dataset Loaders " --> ./load/ @@ -140,7 +199,6 @@ graph LR src/frdc/ -- " Train Deps " --> ./train/ src/frdc/ -- " Model Architectures " --> ./models/ rsc/ -- " Datasets ... " --> ./dataset_name/ - pipeline/ -- " Model Training Pipeline " --> ./model_tests/ ``` src/frdc/ @@ -149,11 +207,8 @@ src/frdc/ rsc/ : Resources. These are usually cached datasets -pipeline/ -: Pipeline code. These are the full ML tests of our pipeline. - tests/ -: PyTest tests. These are unit tests & integration tests. +: PyTest tests. These are unit, integration, and model tests. ### Unit, Integration, and Pipeline Tests @@ -161,7 +216,7 @@ We have 3 types of tests: - Unit Tests are usually small, single function tests. - Integration Tests are larger tests that tests a mock pipeline. -- Pipeline Tests are the true production pipeline tests that will generate a +- Model Tests are the true production pipeline tests that will generate a model. ### Where Should I contribute? @@ -176,9 +231,9 @@ at the src/frdc/ directory. By adding a new component, you'll need to add a new test. Take a look at the tests/ directory. - + If you're a ML Researcher, you'll probably be changing the pipeline. Take a -look at the pipeline/ directory. +look at the tests/model_tests/ directory. 
If you're adding a new dependency, use poetry add PACKAGE and diff --git a/Writerside/topics/Retrieve-our-Datasets.md b/Writerside/topics/Retrieve-our-Datasets.md index 46141afe..9c671cbd 100644 --- a/Writerside/topics/Retrieve-our-Datasets.md +++ b/Writerside/topics/Retrieve-our-Datasets.md @@ -25,16 +25,17 @@ Here, we'll download and load our - `labels`: The labels of the trees (segments) ```python -from frdc.load.dataset import FRDCDataset +from frdc.load.preset import FRDCDatasetPreset -ds = FRDCDataset(site="chestnut_nature_park", date="20201218", version=None) +ds = FRDCDatasetPreset.chestnut_20201218() ar, order = ds.get_ar_bands() bounds, labels = ds.get_bounds_and_labels() ``` ### What Datasets are there? {collapsible="true"} -> To know what datasets are available, you can run +> We recommend to use FRDCDatasetPreset. However, if you want +> to know what other datasets are available, you can run > [load.gcs](load.gcs.md)'s `list_gcs_datasets()` > method @@ -86,10 +87,10 @@ To segment the data, use [Extract Segments](preprocessing.extract_segments.md). Here, we'll segment the data by the bounds. ```python -from frdc.load.dataset import FRDCDataset +from frdc.load.preset import FRDCDatasetPreset from frdc.preprocess.extract_segments import extract_segments_from_bounds -ds = FRDCDataset(site="chestnut_nature_park", date="20201218", version=None) +ds = FRDCDatasetPreset.chestnut_20201218() ar, order = ds.get_ar_bands() bounds, labels = ds.get_bounds_and_labels() segments = extract_segments_from_bounds(ar, bounds) @@ -109,11 +110,11 @@ We can then use these data to plot out the first tree segment. ```python import matplotlib.pyplot as plt -from frdc.load.dataset import FRDCDataset +from frdc.load.preset import FRDCDatasetPreset from frdc.preprocess.extract_segments import extract_segments_from_bounds from frdc.preprocess.scale import scale_0_1_per_band -ds = FRDCDataset(site="chestnut_nature_park", date="20201218", version=None) +ds = FRDCDatasetPreset.chestnut_20201218() ar, order = ds.get_ar_bands() bounds, labels = ds.get_bounds_and_labels() segments = extract_segments_from_bounds(ar, bounds) diff --git a/Writerside/topics/load.dataset.md b/Writerside/topics/load.dataset.md index e5a57699..7cbf6cbc 100644 --- a/Writerside/topics/load.dataset.md +++ b/Writerside/topics/load.dataset.md @@ -17,11 +17,9 @@ version. For example, to load our Chestnut Nature Park dataset. ```python -from frdc.load import FRDCDataset +from frdc.load.preset import FRDCDatasetPreset -ds = FRDCDataset(site='chestnut_nature_park', - date='20201218', - version=None) +ds = FRDCDatasetPreset.chestnut_20201218() ``` Then, we can use the `ds` object to load objects of the dataset: diff --git a/Writerside/topics/preprocessing.extract_segments.md b/Writerside/topics/preprocessing.extract_segments.md index ed257e8d..a83b3060 100644 --- a/Writerside/topics/preprocessing.extract_segments.md +++ b/Writerside/topics/preprocessing.extract_segments.md @@ -135,12 +135,10 @@ Extract segments from bounds and labels. ```python import numpy as np -from frdc.load import FRDCDataset +from frdc.load.preset import FRDCDatasetPreset from frdc.preprocess.extract_segments import extract_segments_from_bounds -ds = FRDCDataset(site='chestnut_nature_park', - date='20201218', - version=None, ) +ds = FRDCDatasetPreset.chestnut_20201218() ar, order = ds.get_ar_bands() bounds, labels = ds.get_bounds_and_labels() @@ -155,7 +153,7 @@ Extract segments from a label classification. 
from skimage.morphology import remove_small_objects, remove_small_holes import numpy as np -from frdc.load import FRDCDataset +from frdc.load.preset import FRDCDatasetPreset from frdc.preprocess.morphology import ( threshold_binary_mask, binary_watershed ) @@ -164,9 +162,7 @@ from frdc.preprocess.extract_segments import ( extract_segments_from_labels, remove_small_segments_from_labels ) -ds = FRDCDataset(site='chestnut_nature_park', - date='20201218', - version=None, ) +ds = FRDCDatasetPreset.chestnut_20201218() ar, order = ds.get_ar_bands() ar = scale_0_1_per_band(ar) ar_mask = threshold_binary_mask(ar, -1, 90 / 256) diff --git a/Writerside/topics/preprocessing.morphology.md b/Writerside/topics/preprocessing.morphology.md index 50b5d7b2..95289404 100644 --- a/Writerside/topics/preprocessing.morphology.md +++ b/Writerside/topics/preprocessing.morphology.md @@ -29,14 +29,12 @@ classification Perform auto-segmentation on a dataset to yield a label classification. ```python -from frdc.load import FRDCDataset +from frdc.load.preset import FRDCDatasetPreset from frdc.preprocess.morphology import ( threshold_binary_mask, binary_watershed ) -ds = FRDCDataset(site='chestnut_nature_park', - date='20201218', - version=None, ) +ds = FRDCDatasetPreset.chestnut_20201218() ar, order = ds.get_ar_bands() mask = threshold_binary_mask(ar, order.index('NIR'), 90 / 256) ar_label = binary_watershed(mask) diff --git a/Writerside/topics/preprocessing.scale.md b/Writerside/topics/preprocessing.scale.md index 2ce224be..0b0e5946 100644 --- a/Writerside/topics/preprocessing.scale.md +++ b/Writerside/topics/preprocessing.scale.md @@ -35,15 +35,13 @@ Take a look at frdc.conf.BAND_MAX_CONFIG for an example. ## Usage ```python -from frdc.load import FRDCDataset +from frdc.load.preset import FRDCDatasetPreset from frdc.preprocess.scale import ( scale_0_1_per_band, scale_normal_per_band, scale_static_per_band ) from frdc.conf import BAND_MAX_CONFIG -ds = FRDCDataset(site='chestnut_nature_park', - date='20201218', - version=None, ) +ds = FRDCDatasetPreset.chestnut_20201218() ar, order = ds.get_ar_bands() ar_01 = scale_0_1_per_band(ar) ar_norm = scale_normal_per_band(ar) diff --git a/Writerside/writerside.cfg b/Writerside/writerside.cfg index 39e81f21..9e1b0444 100644 --- a/Writerside/writerside.cfg +++ b/Writerside/writerside.cfg @@ -4,5 +4,5 @@ - + \ No newline at end of file diff --git a/docs/HelpTOC.json b/docs/HelpTOC.json index 54d3f877..5467dd78 100644 --- a/docs/HelpTOC.json +++ b/docs/HelpTOC.json @@ -1 +1 @@ -{"entities":{"pages":{"Overview":{"id":"Overview","title":"Overview","url":"overview.html","level":0,"tabIndex":0},"Getting-Started":{"id":"Getting-Started","title":"Getting Started","url":"getting-started.html","level":0,"tabIndex":1},"ae6f1f90_3454":{"id":"ae6f1f90_3454","title":"Tutorials","level":0,"pages":["Retrieve-our-Datasets"],"tabIndex":2},"Retrieve-our-Datasets":{"id":"Retrieve-our-Datasets","title":"Retrieve our Datasets","url":"retrieve-our-datasets.html","level":1,"parentId":"ae6f1f90_3454","tabIndex":0},"mix-match":{"id":"mix-match","title":"MixMatch","url":"mix-match.html","level":0,"pages":["mix-match-module","custom-k-aug-dataloaders"],"tabIndex":3},"mix-match-module":{"id":"mix-match-module","title":"MixMatch Module","url":"mix-match-module.html","level":1,"parentId":"mix-match","tabIndex":0},"custom-k-aug-dataloaders":{"id":"custom-k-aug-dataloaders","title":"Custom K-Aug 
Dataloaders","url":"custom-k-aug-dataloaders.html","level":1,"parentId":"mix-match","tabIndex":1},"ae6f1f90_3459":{"id":"ae6f1f90_3459","title":"Model Tests","level":0,"pages":["Model-Test-Chestnut-May-Dec"],"tabIndex":4},"Model-Test-Chestnut-May-Dec":{"id":"Model-Test-Chestnut-May-Dec","title":"Model Test Chestnut May-Dec","url":"model-test-chestnut-may-dec.html","level":1,"parentId":"ae6f1f90_3459","tabIndex":0},"ae6f1f90_3461":{"id":"ae6f1f90_3461","title":"API","level":0,"pages":["load.dataset","load.gcs","preprocessing.scale","preprocessing.extract_segments","preprocessing.morphology","preprocessing.glcm_padded","train.frdc_lightning"],"tabIndex":5},"load.dataset":{"id":"load.dataset","title":"load.dataset","url":"load-dataset.html","level":1,"parentId":"ae6f1f90_3461","tabIndex":0},"load.gcs":{"id":"load.gcs","title":"load.gcs","url":"load-gcs.html","level":1,"parentId":"ae6f1f90_3461","tabIndex":1},"preprocessing.scale":{"id":"preprocessing.scale","title":"preprocessing.scale","url":"preprocessing-scale.html","level":1,"parentId":"ae6f1f90_3461","tabIndex":2},"preprocessing.extract_segments":{"id":"preprocessing.extract_segments","title":"preprocessing.extract_segments","url":"preprocessing-extract-segments.html","level":1,"parentId":"ae6f1f90_3461","tabIndex":3},"preprocessing.morphology":{"id":"preprocessing.morphology","title":"preprocessing.morphology","url":"preprocessing-morphology.html","level":1,"parentId":"ae6f1f90_3461","tabIndex":4},"preprocessing.glcm_padded":{"id":"preprocessing.glcm_padded","title":"preprocessing.glcm_padded","url":"preprocessing-glcm-padded.html","level":1,"parentId":"ae6f1f90_3461","tabIndex":5},"train.frdc_lightning":{"id":"train.frdc_lightning","title":"train.frdc_datamodule \u0026 frdc_module","url":"train-frdc-lightning.html","level":1,"parentId":"ae6f1f90_3461","tabIndex":6}}},"topLevelIds":["Overview","Getting-Started","ae6f1f90_3454","mix-match","ae6f1f90_3459","ae6f1f90_3461"]} \ No newline at end of file +{"entities":{"pages":{"Overview":{"id":"Overview","title":"Overview","url":"overview.html","level":0,"tabIndex":0},"Getting-Started":{"id":"Getting-Started","title":"Getting Started","url":"getting-started.html","level":0,"pages":["Get-Started-with-Dev-Containers"],"tabIndex":1},"Get-Started-with-Dev-Containers":{"id":"Get-Started-with-Dev-Containers","title":"Get Started with Dev Containers","url":"get-started-with-dev-containers.html","level":1,"parentId":"Getting-Started","tabIndex":0},"f6c570e4_4234":{"id":"f6c570e4_4234","title":"Tutorials","level":0,"pages":["Retrieve-our-Datasets"],"tabIndex":2},"Retrieve-our-Datasets":{"id":"Retrieve-our-Datasets","title":"Retrieve our Datasets","url":"retrieve-our-datasets.html","level":1,"parentId":"f6c570e4_4234","tabIndex":0},"mix-match":{"id":"mix-match","title":"MixMatch","url":"mix-match.html","level":0,"pages":["mix-match-module","custom-k-aug-dataloaders"],"tabIndex":3},"mix-match-module":{"id":"mix-match-module","title":"MixMatch Module","url":"mix-match-module.html","level":1,"parentId":"mix-match","tabIndex":0},"custom-k-aug-dataloaders":{"id":"custom-k-aug-dataloaders","title":"Custom K-Aug Dataloaders","url":"custom-k-aug-dataloaders.html","level":1,"parentId":"mix-match","tabIndex":1},"f6c570e4_4239":{"id":"f6c570e4_4239","title":"Model Tests","level":0,"pages":["Model-Test-Chestnut-May-Dec"],"tabIndex":4},"Model-Test-Chestnut-May-Dec":{"id":"Model-Test-Chestnut-May-Dec","title":"Model Test Chestnut 
May-Dec","url":"model-test-chestnut-may-dec.html","level":1,"parentId":"f6c570e4_4239","tabIndex":0},"f6c570e4_4241":{"id":"f6c570e4_4241","title":"API","level":0,"pages":["load.dataset","load.gcs","preprocessing.scale","preprocessing.extract_segments","preprocessing.morphology","preprocessing.glcm_padded","train.frdc_lightning"],"tabIndex":5},"load.dataset":{"id":"load.dataset","title":"load.dataset","url":"load-dataset.html","level":1,"parentId":"f6c570e4_4241","tabIndex":0},"load.gcs":{"id":"load.gcs","title":"load.gcs","url":"load-gcs.html","level":1,"parentId":"f6c570e4_4241","tabIndex":1},"preprocessing.scale":{"id":"preprocessing.scale","title":"preprocessing.scale","url":"preprocessing-scale.html","level":1,"parentId":"f6c570e4_4241","tabIndex":2},"preprocessing.extract_segments":{"id":"preprocessing.extract_segments","title":"preprocessing.extract_segments","url":"preprocessing-extract-segments.html","level":1,"parentId":"f6c570e4_4241","tabIndex":3},"preprocessing.morphology":{"id":"preprocessing.morphology","title":"preprocessing.morphology","url":"preprocessing-morphology.html","level":1,"parentId":"f6c570e4_4241","tabIndex":4},"preprocessing.glcm_padded":{"id":"preprocessing.glcm_padded","title":"preprocessing.glcm_padded","url":"preprocessing-glcm-padded.html","level":1,"parentId":"f6c570e4_4241","tabIndex":5},"train.frdc_lightning":{"id":"train.frdc_lightning","title":"train.frdc_datamodule \u0026 frdc_module","url":"train-frdc-lightning.html","level":1,"parentId":"f6c570e4_4241","tabIndex":6}}},"topLevelIds":["Overview","Getting-Started","f6c570e4_4234","mix-match","f6c570e4_4239","f6c570e4_4241"]} \ No newline at end of file diff --git a/docs/Map.jhm b/docs/Map.jhm index 2442fa52..9449faa3 100644 --- a/docs/Map.jhm +++ b/docs/Map.jhm @@ -1 +1 @@ - \ No newline at end of file + \ No newline at end of file diff --git a/docs/config.json b/docs/config.json index a83934cd..1f05ea18 100644 --- a/docs/config.json +++ b/docs/config.json @@ -1 +1 @@ -{"productVersion":"0.0.7","productId":"d","stage":"release","downloadTitle":"Get Documentation","keymaps":{},"searchMaxHits":75,"productName":"Documentation"} \ No newline at end of file +{"productVersion":"0.0.8","productId":"d","stage":"release","downloadTitle":"Get Documentation","keymaps":{},"searchMaxHits":75,"productName":"Documentation"} \ No newline at end of file diff --git a/docs/current.help.version b/docs/current.help.version index 5c4511c3..7d6b3eb3 100644 --- a/docs/current.help.version +++ b/docs/current.help.version @@ -1 +1 @@ -0.0.7 \ No newline at end of file +0.0.8 \ No newline at end of file diff --git a/docs/custom-k-aug-dataloaders.html b/docs/custom-k-aug-dataloaders.html index f3bc78b7..473d540d 100644 --- a/docs/custom-k-aug-dataloaders.html +++ b/docs/custom-k-aug-dataloaders.html @@ -1,4 +1,4 @@ - Custom K-Aug Dataloaders | Documentation

Documentation 0.0.7 Help

Custom K-Aug Dataloaders

In MixMatch, implementing the data loading methods is quite unconventional.

  1. We need to load multiple augmented versions of the same image into the same batch.

  2. The labelled set is usually too small, causing a premature end to the epoch as it runs out of samples to draw from faster than the unlabelled set.

This can be rather tricky to implement in PyTorch. This tutorial will illustrate how we did it.

Loading Multiple Augmented Versions of the Same Image

See: frdc/load/dataset.py FRDCDataset.__getitem__

In MixMatch, a single train batch must consist of:

  1. A batch of labeled images

  2. K batches of unlabeled images

[Diagram: Get Batch → Labelled Batch → Aug → Aug Labelled Batch; Get Batch → Unlabelled Batch → Aug (×K) → Aug Unl. Batch 1 … K]

Keep in mind that the unlabelled batch is a single batch of images, not separate draws of batches. It is then "duplicated" K times, and each copy is augmented differently.

Solution 1: Custom Dataset

To solve this, we need to understand the role of both a Dataset and a DataLoader.

  • A Dataset represents a collection of data, responsible for loading and returning something.

  • A DataLoader draws samples from a Dataset and returns batched samples.

The key here is that a Dataset is not limited to returning 1 sample at a time; we can make it return the K augmented versions of the same image.

[Diagram: Sample → Aug (×K) → Aug Sample 1 … K]

In code, this is done by subclassing the Dataset class and overriding the __getitem__ method.

+ Custom K-Aug Dataloaders | Documentation

Documentation 0.0.8 Help

Custom K-Aug Dataloaders

In MixMatch, implementing the data loading methods is quite unconventional.

  1. We need to load multiple augmented versions of the same image into the same batch.

  2. The labelled set is usually too small, causing a premature end to the epoch as it runs out of samples to draw from faster than the unlabelled set.

This can be rather tricky to implement in PyTorch. This tutorial will illustrate how we did it.

Loading Multiple Augmented Versions of the Same Image

See: frdc/load/dataset.py FRDCDataset.__getitem__

In MixMatch, a single train batch must consist of:

  1. A batch of labeled images

  2. K batches of unlabeled images

[Diagram: Get Batch → Labelled Batch → Aug → Aug Labelled Batch; Get Batch → Unlabelled Batch → Aug (×K) → Aug Unl. Batch 1 … K]

Keep in mind that the unlabelled batch is a single batch of images, not separate draws of batches. It is then "duplicated" K times, and each copy is augmented differently.

Solution 1: Custom Dataset

To solve this, we need to understand the role of both a Dataset and a DataLoader.

  • A Dataset represents a collection of data, responsible for loading and returning something.

  • A DataLoader draws samples from a Dataset and returns batched samples.

The key here is that a Dataset is not limited to returning 1 sample at a time; we can make it return the K augmented versions of the same image.

[Diagram: Sample → Aug (×K) → Aug Sample 1 … K]

In code, this is done by subclassing the Dataset class and overriding the __getitem__ method.

def duplicate(x): return x, deepcopy(x), deepcopy(x) @@ -10,7 +10,7 @@ def __getitem__(self, index): x, y = self.dataset[index] return self.aug(x), y -

In the above example, we have a Dataset that returns 3 duplicate versions of the same image. By leveraging this technique, we can create a Dataset that returns K augmented versions of the same image as a tuple.

Premature End of Epoch due to Small Labelled Set

See: frdc/train/frdc_datamodule.py

In MixMatch, the definition of an "epoch" is a bit different. Instead of implying that we have seen all the data once, it implies that we've drawn N batches. The N is referred to as the number of iterations per epoch.

Take, for example, a labelled set of numbers [1, 2, 3] and an unlabelled set [4, 5, 6, 7, 8, 9, 10]. With a batch size of 2, we'll run out of labelled samples after 2 iterations, but we'll still have 3 more iterations for the unlabelled set.

  • Draw 1: [1, 2], [4, 5]

  • Draw 2: [3], [6, 7].

  • Epoch ends.

Solution 2: Random Sampling

To fix this, instead of sequentially sampling the labelled set (and the unlabelled set), we can sample them randomly. This way, we can ensure that the labelled set never runs out.

  • Draw 1: [1, 3], [7, 5]

  • Draw 2: [2, 1], [4, 9]

  • Draw 3: [3, 2], [8, 6]

  • ... and so on.

Luckily, PyTorch's DataLoader supports random sampling. We just need to use RandomSampler instead of SequentialSampler (which is the default).

+

In the above example, we have a Dataset that returns 3 duplicate versions of the same image. By leveraging this technique, we can create a Dataset that returns K augmented versions of the same image as a tuple.
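For instance, a minimal sketch of such a wrapper (the class name and constructor arguments here are illustrative, not the actual FRDCDataset API):

```python
from torch.utils.data import Dataset

class KAugDataset(Dataset):
    """Wraps a dataset so __getitem__ returns K augmented views of one image."""

    def __init__(self, dataset, aug, k):
        self.dataset = dataset
        self.aug = aug  # any callable image transform
        self.k = k

    def __len__(self):
        return len(self.dataset)

    def __getitem__(self, index):
        x, y = self.dataset[index]
        # K independently augmented copies of the same image, as a tuple.
        return tuple(self.aug(x) for _ in range(self.k)), y
```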

Premature End of Epoch due to Small Labelled Set

See: frdc/train/frdc_datamodule.py

In MixMatch, the definition of an "epoch" is a bit different. Instead of implying that we have seen all the data once, it implies that we've drawn N batches. The N is referred to as the number of iterations per epoch.

Take, for example, a labelled set of numbers [1, 2, 3] and an unlabelled set [4, 5, 6, 7, 8, 9, 10]. With a batch size of 2, we'll run out of labelled samples after 2 iterations, but we'll still have 3 more iterations for the unlabelled set.

  • Draw 1: [1, 2], [4, 5]

  • Draw 2: [3], [6, 7].

  • Epoch ends.

Solution 2: Random Sampling

To fix this, instead of sequentially sampling the labelled set (and the unlabelled set), we can sample them randomly. This way, we can ensure that the labelled set never runs out.

  • Draw 1: [1, 3], [7, 5]

  • Draw 2: [2, 1], [4, 9]

  • Draw 3: [3, 2], [8, 6]

  • ... and so on.

Luckily, PyTorch's DataLoader supports random sampling. We just need to use RandomSampler instead of SequentialSampler (which is the default).

from torch.utils.data import DataLoader, RandomSampler dl = DataLoader( @@ -21,4 +21,4 @@ replacement=False, ) ) -

This will ensure that the "epoch" ends when we've drawn train_iters batches.

Last modified: 20 December 2023
\ No newline at end of file +

This will ensure that the "epoch" ends when we've drawn train_iters batches.

Last modified: 29 December 2023
\ No newline at end of file diff --git a/docs/get-started-with-dev-containers.html b/docs/get-started-with-dev-containers.html new file mode 100644 index 00000000..be7dc455 --- /dev/null +++ b/docs/get-started-with-dev-containers.html @@ -0,0 +1,3 @@ + Get Started with Dev Containers | Documentation

Documentation 0.0.8 Help

Get Started with Dev Containers

Dev Containers are a great way to get started with a project. They define all necessary dependencies and environments, so you can just start coding within the container.

In this article, we'll only go over the additional steps needed to set up our project. For more information on how to use Dev Containers, please refer to the official documentation for each IDE. Once you've set up the Dev Container, come back here to finish the setup:

Python Environment

The dev environment is already created and is managed by Anaconda /opt/conda/bin/conda. To activate the environment, run the following command:

+conda activate base +

Mark as Sources Root (Add to PYTHONPATH)

For import statements to work, you need to mark the src folder as the sources root. Optionally, also mark the tests folder as the tests root.
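If your IDE doesn't manage this for you, a minimal shell-based alternative (assuming you run Python from the project root) is to extend PYTHONPATH directly, as also shown in the Getting Started troubleshooting:

```shell
export PYTHONPATH=$PYTHONPATH:./src:./tests
```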

Additional Setup

Refer to the Getting Started guide for additional setup steps such as:

  • Google Cloud Application Default Credentials

  • Weights & Biases API Key

  • Label Studio API Key

Last modified: 29 December 2023
\ No newline at end of file diff --git a/docs/getting-started.html b/docs/getting-started.html index 172d307d..8bc4700d 100644 --- a/docs/getting-started.html +++ b/docs/getting-started.html @@ -1,20 +1,22 @@ - Getting Started | Documentation

Documentation 0.0.7 Help

Getting Started

Installing the Dev. Environment

  1. Ensure that you have the right version of Python. The required Python version can be seen in pyproject.toml

    + Getting Started | Documentation

    Documentation 0.0.8 Help

    Getting Started

    Installing the Dev. Environment

    1. Ensure that you have the right version of Python. The required Python version can be seen in pyproject.toml

      [tool.poetry.dependencies] python = "..." -
    2. Start by cloning our repository.

      - git clone https://github.com/Forest-Recovery-Digital-Companion/FRDC-ML.git -
    3. Then, create a Python Virtual Env pyvenv

      python -m venv venv/
      python3 -m venv venv/
    4. Install Poetry Then check if it's installed with

      poetry --version
    5. Activate the virtual environment

      +
    6. Start by cloning our repository.

      + git clone https://github.com/FR-DC/FRDC-ML.git +
    7. Then, create a Python Virtual Env pyvenv

      python -m venv venv/
      python3 -m venv venv/
    8. Install Poetry Then check if it's installed with

      poetry --version
    9. Activate the virtual environment

      cd venv/Scripts activate cd ../.. -
      +
      source venv/bin/activate -
    10. Install the dependencies. You should be in the same directory as pyproject.toml

      +
  2. Install the dependencies. You should be in the same directory as pyproject.toml

    poetry install --with dev -
  3. Install Pre-Commit Hooks

    +
  4. Install Pre-Commit Hooks

    pre-commit install -

Setting Up Google Cloud

  1. We use Google Cloud to store our datasets. To set up Google Cloud, install the Google Cloud CLI

  2. Then, authenticate your account.

    gcloud auth login
  3. Finally, set up Application Default Credentials (ADC).

    gcloud auth application-default login
  4. To make sure everything is working, run the tests.

Pre-commit Hooks

  • +

Setting Up Google Cloud

  1. We use Google Cloud to store our datasets. To set up Google Cloud, install the Google Cloud CLI

  2. Then, authenticate your account.

    gcloud auth login
  3. Finally, set up Application Default Credentials (ADC).

    gcloud auth application-default login
  4. To make sure everything is working, run the tests.

Setting Up Label Studio

  1. We use Label Studio to annotate our datasets. We won't go through how to install Label Studio; for contributors, it should be up on localhost:8080.

  2. Then, retrieve your own API key from Label Studio. Go to your account page and copy the API key.


  3. Set your API key as an environment variable.

    On Windows, go to "Edit environment variables for your account" and add this as a new environment variable with name LABEL_STUDIO_API_KEY.

    Export it as an environment variable.

    export LABEL_STUDIO_API_KEY=...
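To sanity-check that the key is visible to Python, a minimal sketch (not part of the FRDC API):

```python
import os

# Raises if the environment variable is missing or empty.
assert os.environ.get("LABEL_STUDIO_API_KEY"), "LABEL_STUDIO_API_KEY is not set"
```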

Setting Up Weights and Biases

  1. We use W&B to track our experiments. To set up W&B, install the W&B CLI

  2. Then, authenticate your account.

    wandb login

Pre-commit Hooks

  • pre-commit install -

Running the Tests

  1. Run the tests to make sure everything is working

    +

Running the Tests

  • Run the tests to make sure everything is working

    pytest -
  • In case of errors:

    google.auth.exceptions.DefaultCredentialsError

    If you get this error, it means that you haven't authenticated your Google Cloud account. See Setting Up Google Cloud

    ModuleNotFoundError

    If you get this error, it means that you haven't installed the dependencies. See Installing the Dev. Environment

Our Repository Structure

Before starting development, take a look at our repository structure. This will help you understand where to put your code.

[Diagram: FRDC → src/frdc/ (Core Dependencies), rsc/ (Resources), pipeline/ (Pipeline), tests/ (Tests), pyproject.toml,poetry.lock (Repo Dependencies); src/frdc/ → ./load/ (Dataset Loaders), ./preprocess/ (Preprocessing Fn.), ./train/ (Train Deps), ./models/ (Model Architectures); rsc/ → ./dataset_name/ (Datasets ...); pipeline/ → ./model_tests/ (Model Training Pipeline)]
src/frdc/

Source Code for our package. These are the unit components of our pipeline.

rsc/

Resources. These are usually cached datasets.

pipeline/

Pipeline code. These are the full ML tests of our pipeline.

tests/

PyTest tests. These are unit tests & integration tests.

Unit, Integration, and Pipeline Tests

We have 3 types of tests:

  • Unit Tests are usually small, single function tests.

  • Integration Tests are larger tests that test a mock pipeline.

  • Pipeline Tests are the true production pipeline tests that will generate a model.

Where Should I contribute?

Changing a small component

If you're changing a small component, such as an argument for preprocessing, a new model architecture, or a new configuration for a dataset, take a look at the src/frdc/ directory.

Adding a test

When adding a new component, you'll need to add a new test. Take a look at the tests/ directory.

Changing the pipeline

If you're an ML Researcher, you'll probably be changing the pipeline. Take a look at the pipeline/ directory.

Adding a dependency

If you're adding a new dependency, use poetry add PACKAGE and commit the changes to pyproject.toml and poetry.lock.

Last modified: 20 December 2023
\ No newline at end of file +

Troubleshooting

ModuleNotFoundError

It's likely that your src and tests directories are not in PYTHONPATH. To fix this, run the following command:

+export PYTHONPATH=$PYTHONPATH:./src:./tests +

Or, set it in your IDE; for example, IntelliJ allows setting directories as Source Roots.

google.auth.exceptions.DefaultCredentialsError

It's likely that you haven't authenticated your Google Cloud account. See Setting Up Google Cloud

Couldn't connect to Label Studio

Label Studio must be running locally, exposed on localhost:8080. Furthermore, you need to specify the LABEL_STUDIO_API_KEY environment variable. See Setting Up Label Studio

Cannot login to W&B

You need to authenticate your W&B account. See Setting Up Weights and Biases. If you're facing difficulties, set the WANDB_MODE environment variable to offline to disable W&B.
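For example, in a shell:

```shell
export WANDB_MODE=offline
```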

Our Repository Structure

Before starting development, take a look at our repository structure. This will help you understand where to put your code.

[Diagram: FRDC → src/frdc/ (Core Dependencies), rsc/ (Resources), tests/ (Tests), pyproject.toml,poetry.lock (Repo Dependencies); src/frdc/ → ./load/ (Dataset Loaders), ./preprocess/ (Preprocessing Fn.), ./train/ (Train Deps), ./models/ (Model Architectures); rsc/ → ./dataset_name/ (Datasets ...)]
src/frdc/

Source Code for our package. These are the unit components of our pipeline.

rsc/

Resources. These are usually cached datasets.

tests/

PyTest tests. These are unit, integration, and model tests.

Unit, Integration, and Model Tests

We have 3 types of tests:

  • Unit Tests are usually small, single function tests.

  • Integration Tests are larger tests that test a mock pipeline.

  • Model Tests are the true production pipeline tests that will generate a model.

Where Should I contribute?

Changing a small component

If you're changing a small component, such as an argument for preprocessing, a new model architecture, or a new configuration for a dataset, take a look at the src/frdc/ directory.

Adding a test

When adding a new component, you'll need to add a new test. Take a look at the tests/ directory.

Changing the model pipeline

If you're an ML Researcher, you'll probably be changing the pipeline. Take a look at the tests/model_tests/ directory.

Adding a dependency

If you're adding a new dependency, use poetry add PACKAGE and commit the changes to pyproject.toml and poetry.lock.

Last modified: 29 December 2023
\ No newline at end of file diff --git a/docs/load-dataset.html b/docs/load-dataset.html index 09a97fb1..8ae04891 100644 --- a/docs/load-dataset.html +++ b/docs/load-dataset.html @@ -1,14 +1,12 @@ - load.dataset | Documentation

Documentation 0.0.7 Help

load.dataset

Usage

Firstly, to load a dataset instance, you need to initialize a FRDCDataset object, providing the site, date, and version.

For example, to load our Chestnut Nature Park dataset.

-from frdc.load import FRDCDataset + load.dataset | Documentation

Documentation 0.0.8 Help

load.dataset

Usage

Firstly, to load a dataset instance, you need to initialize a FRDCDataset object, providing the site, date, and version.

For example, to load our Chestnut Nature Park dataset.

+from frdc.load.preset import FRDCDatasetPreset -ds = FRDCDataset(site='chestnut_nature_park', - date='20201218', - version=None) -

Then, we can use the ds object to load objects of the dataset:

+ds = FRDCDatasetPreset.chestnut_20201218() +

Then, we can use the ds object to load objects of the dataset:

ar, order = ds.get_ar_bands() d = ds.get_ar_bands_as_dict() bounds, labels = ds.get_bounds_and_labels() -
  • ar is a stacked NDArray of the hyperspectral bands of shape (H x W x C)

  • order is a list of strings, containing the names of the bands, ordered according to the channels of ar

  • d is a dictionary of the hyperspectral bands of shape (H x W), keyed by the band names

  • bounds is a list of bounding boxes, in the format of Rect, a namedtuple of x0, y0, x1, y1

  • labels is a list of strings, containing the labels of the bounding boxes, ordered according to bounds

Filters

You can also selectively get the channels for both get_ar_bands() and get_ar_bands_as_dict() by providing a list of strings to the bands argument.

For example, to get the Wideband RGB bands, you can do:

+
  • ar is a stacked NDArray of the hyperspectral bands of shape (H x W x C)

  • order is a list of strings, containing the names of the bands, ordered according to the channels of ar

  • d is a dictionary of the hyperspectral bands of shape (H x W), keyed by the band names

  • bounds is a list of bounding boxes, in the format of Rect, a namedtuple of x0, y0, x1, y1

  • labels is a list of strings, containing the labels of the bounding boxes, ordered according to bounds

Filters

You can also selectively get the channels for both get_ar_bands() and get_ar_bands_as_dict() by providing a list of strings to the bands argument.

For example, to get the Wideband RGB bands, you can do:

ar, order = ds.get_ar_bands(bands=['WR', 'WG', 'WB']) d = ds.get_ar_bands_as_dict(bands=['WR', 'WG', 'WB']) -

This will also alter the channel order to the order of the bands provided.

See load.gcs for configuration options.

Last modified: 20 December 2023
\ No newline at end of file +

This will also alter the channel order to the order of the bands provided.

See load.gcs for configuration options.

Last modified: 29 December 2023
\ No newline at end of file diff --git a/docs/load-gcs.html b/docs/load-gcs.html index e135d6e1..ff221005 100644 --- a/docs/load-gcs.html +++ b/docs/load-gcs.html @@ -1,11 +1,11 @@ - load.gcs | Documentation

Documentation 0.0.7 Help

load.gcs

Usage

These are defined in the top-level load.gcs module.

list_gcs_datasets

Lists all datasets in the bucket as a DataFrame. This works by checking which folders have a specific file, which we call the anchor.

download

Downloads a file from Google Cloud Storage and returns the local file path.

open_file

Downloads and opens a file from Google Cloud Storage. Returns a file handle.

open_image

Downloads and returns the PIL image from Google Cloud Storage.

Pathing

The path to specify is relative to the bucket, which is frdc-ds by default.

For example this filesystem on GCS:

+ load.gcs | Documentation

Documentation 0.0.8 Help

load.gcs

Usage

These are defined in the top-level load.gcs module.

list_gcs_datasets

Lists all datasets in the bucket as a DataFrame. This works by checking which folders have a specific file, which we call the anchor.

download

Downloads a file from Google Cloud Storage and returns the local file path.

open_file

Downloads and opens a file from Google Cloud Storage. Returns a file handle.

open_image

Downloads and returns the PIL image from Google Cloud Storage.

Pathing

The path to specify is relative to the bucket, which is frdc-ds by default.

For example this filesystem on GCS:

# On Google Cloud Storage frdc-ds ├── chestnut_nature_park │ └── 20201218 │ └── 90deg │ └── bounds.json -

To download bounds.json, use download(r"chestnut_nature_park/20201218/90deg/bounds.json"). By default, all files will be downloaded to PROJ_DIR/rsc/....

+

To download bounds.json, use download(r"chestnut_nature_park/20201218/90deg/bounds.json"). By default, all files will be downloaded to PROJ_DIR/rsc/....

# On local filesystem PROJ_DIR ├── rsc @@ -13,4 +13,4 @@ │ └── 20201218 │ └── 90deg │ └── bounds.json -
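Putting it together, a minimal sketch of downloading and opening this file (assuming download and open_file are importable from frdc.load.gcs; check the module for the exact signatures):

```python
from frdc.load.gcs import download, open_file

# Returns the local file path, downloading from GCS if needed.
local_path = download(r"chestnut_nature_park/20201218/90deg/bounds.json")

# Or download and open in one step; returns a file handle.
with open_file(r"chestnut_nature_park/20201218/90deg/bounds.json") as f:
    print(f.read())
```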

Configuration

If you need granular control over

  • where the files are downloaded

  • the credentials used

  • the project used

  • the bucket used

Then edit conf.py.

GCS_CREDENTIALS

Google Cloud credentials.


A google.oauth2.service_account.Credentials object. See the object documentation for more information.

LOCAL_DATASET_ROOT_DIR

Local directory to download files to.


Path to a directory, or a Path object.

GCS_PROJECT_ID

Google Cloud project ID.


GCS_BUCKET_NAME

Google Cloud Storage bucket name.


Last modified: 20 December 2023
\ No newline at end of file +

Configuration

If you need granular control over

  • where the files are downloaded

  • the credentials used

  • the project used

  • the bucket used

Then edit conf.py.

GCS_CREDENTIALS

Google Cloud credentials.


A google.oauth2.service_account.Credentials object. See the object documentation for more information.

LOCAL_DATASET_ROOT_DIR

Local directory to download files to.


Path to a directory, or a Path object.

GCS_PROJECT_ID

Google Cloud project ID.


GCS_BUCKET_NAME

Google Cloud Storage bucket name.


Last modified: 29 December 2023
\ No newline at end of file diff --git a/docs/mix-match-module.html b/docs/mix-match-module.html index f622c5c5..9ef02365 100644 --- a/docs/mix-match-module.html +++ b/docs/mix-match-module.html @@ -1,4 +1,4 @@ - MixMatch Module | Documentation

Documentation 0.0.7 Help

MixMatch Module

See frdc/train/mixmatch_module.py.

Quick Recap

We will go over the essential parts of the code here. Before that, we revise some of the concepts that are used in the code.

Abstract Methods

In Python, we can define abstract methods using the abc module. Just like in other OOP languages, abstract methods are methods that must be implemented by the child class.

For example:

+ MixMatch Module | Documentation

Documentation 0.0.8 Help

MixMatch Module

See frdc/train/mixmatch_module.py.

Quick Recap

We will go over the essential parts of the code here. Before that, we revise some of the concepts that are used in the code.

Abstract Methods

In Python, we can define abstract methods using the abc module. Just like in other OOP languages, abstract methods are methods that must be implemented by the child class.

For example:

from abc import ABC, abstractmethod @@ -11,7 +11,7 @@ class MyChildClass(MyAbstractClass): def my_abstract_method(self): print("Hello World!") -

nn.Module & LightningModule

If you're unfamiliar with PyTorch, you should read the nn.Module Documentation.

nn.Module is the base class for all neural network modules in PyTorch, while LightningModule is a PyTorch Lightning class that extends nn.Module, providing additional functionality that reduces boilerplate code.

By implementing it as a LightningModule, we also enter the PyTorch Lightning ecosystem, which provides us with a lot of useful features such as logging, early stopping, and more.

What do we implement in a Module?

One key component that nn.Module requires is the model. So for example:

+

nn.Module & LightningModule

If you're unfamiliar with PyTorch, you should read the nn.Module Documentation.

nn.Module is the base class for all neural network modules in PyTorch, while LightningModule is a PyTorch Lightning class that extends nn.Module, providing additional functionality that reduces boilerplate code.

By implementing it as a LightningModule, we also enter the PyTorch Lightning ecosystem, which provides us with a lot of useful features such as logging, early stopping, and more.

What do we implement in a Module?

One key component that nn.Module requires is the model. So for example:

class MyModule(nn.Module): def __init__(self): super().__init__() @@ -23,7 +23,7 @@ def forward(self, x): return self.model(x) -

PyTorch Lightning builds on top of it, requiring training_step and validation_step. Each "step" is a batch of data, and the model is trained on it. So for example:

+

PyTorch Lightning builds on top of it, requiring training_step and validation_step. Each "step" is a batch of data, and the model is trained on it. So for example:

class MyModule(LightningModule): def __init__(self): ... @@ -40,7 +40,7 @@ y_hat = self(x) loss = F.cross_entropy(y_hat, y) return loss -

Usually, the training and validation steps are the same, but in some cases, such as MixMatch, they are different. In MixMatch, we not only use a different loss function for training, but we also handle batches differently. The PyTorch Lightning framework allows us to separate the two and implement them separately.

Model Embedded Preprocessing on_before_batch_transfer

In PyTorch Lightning, we can also inject a step before the batch is passed to the model. This is done by overriding the on_before_batch_transfer method.

[Diagram: Batch → on_before_batch_transfer → training_step / validation_step]

This allows us to do preprocessing on the batch, such as scaling the data, encoding the labels, and more.

Custom EMA Update on_after_backward

We also leverage another hook, called on_after_backward. This hook is called after the backward pass, and allows us to do custom operations. In our case, we use it to update the EMA model.

[Diagram: Batch → training_step → on_after_backward → update_ema]

MixMatch

We recommend having tests/model_tests/chestnut_dec_may/train.py open while reading this section. It implements a real-world example of MixMatch.

As a summary:

  1. We learned what an abstract method is, and how to implement one

  2. We implement the model in LightningModule much like we would in nn.Module

  3. We implement on_before_batch_transfer to preprocess the batch

  4. Finally, we implement on_after_backward to update the EMA model

With the above in mind, let's look at the MixMatch implementation.

forward (abstract)

Forward pass of the model

ema_model (abstract)

The model that is used for EMA. We expect this property to be implemented by the child class.

update_ema (abstract)

The method to update the EMA model. We expect this method to be implemented by the child class.

loss_unl_scaler (static)

Takes in the current progress of the training, 0.0 to 1.0, where 0.0 is the start of the training, and 1.0 is the end. Then, returns the multiplier for the unlabeled loss.

loss_lbl (static)

Implements the loss for labeled data. Takes in the predicted labels and the ground truth labels, and returns the loss. This is cross entropy for MixMatch.

loss_unl (static)

Implements the loss for unlabeled data. Takes in the predicted labels and the ground truth labels, and returns the loss. This is MSE for MixMatch.

mixup

Takes in the data and the labels, the beta distribution parameter, and returns the mixed data and labels.

sharpen

Takes in the labels and temperature, and returns the sharpened labels.

guess_labels

Takes in the unlabeled data, and returns the guessed labels.

progress

The current progress of the training, 0.0 to 1.0, where 0.0 is the start of the training, and 1.0 is the end.

training_step

The training step runs through 1 batch of data, and returns the loss. Note that this is significantly different from the validation step, as we handle the K-Augmented data differently.

test / validation_step

The test / validation step runs through 1 batch of data, and returns the loss.

predict_step

The predict step runs through 1 batch of data, and returns the actual decoded labels.

on_after_backward

The on_after_backward hook is called after the backward pass, and allows us to do custom operations. In our case, we use it to update the EMA model.

on_before_batch_transfer

The on_before_batch_transfer hook is called before the batch is transferred to the GPU. In our case, we use it to preprocess the batch.

A diagram of how these components interact with each other is shown below:

[Diagram: Batch → on_before_batch_transfer → training_step → guess_labels → sharpen → mix_up → loss_unl (scaled by loss_unl_scaler) + loss_lbl → loss → backward → on_after_backward → update_ema; validation_step → loss]

Finally, we show an example of how to use the MixMatch module:

+

Usually, the training and validation steps are the same, but in some cases, such as MixMatch, they are different. In MixMatch, we not only use a different loss function for training, but we also handle batches differently. The PyTorch Lightning framework allows us to separate the two and implement them separately.

Model Embedded Preprocessing on_before_batch_transfer

In PyTorch Lightning, we can also inject a step before the batch is passed to the model. This is done by overriding the on_before_batch_transfer method.

[Diagram: Batch → on_before_batch_transfer → training_step / validation_step]

This allows us to do preprocessing on the batch, such as scaling the data, encoding the labels, and more.
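As a sketch, overriding the hook looks like this (the hook name and signature are PyTorch Lightning's; the scaling logic is illustrative):

```python
from lightning import LightningModule

class MyPreprocessedModule(LightningModule):
    # Called before the batch is moved to the device.
    def on_before_batch_transfer(self, batch, dataloader_idx):
        x, y = batch
        # e.g. scale raw pixel values to [0, 1].
        return x / 255.0, y
```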

Custom EMA Update on_after_backward

We also leverage another hook, called on_after_backward. This hook is called after the backward pass, and allows us to do custom operations. In our case, we use it to update the EMA model.

[Diagram: Batch → training_step → on_after_backward → update_ema]
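A minimal sketch of such an EMA update (the decay value and helper are illustrative, not the exact in-repo implementation):

```python
import torch

@torch.no_grad()
def update_ema(model, ema_model, decay=0.999):
    # Exponential moving average of the weights, called after each backward pass.
    for p, ema_p in zip(model.parameters(), ema_model.parameters()):
        ema_p.mul_(decay).add_(p, alpha=1 - decay)
```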

MixMatch

We recommend having tests/model_tests/chestnut_dec_may/train.py open while reading this section. It implements a real-world example of MixMatch.

As a summary:

  1. We learned what an abstract method is, and how to implement one

  2. We implement the model in LightningModule much like we would in nn.Module

  3. We implement on_before_batch_transfer to preprocess the batch

  4. Finally, we implement on_after_backward to update the EMA model

With the above in mind, let's look at the MixMatch implementation.

forward (abstract)

Forward pass of the model

ema_model (abstract)

The model that is used for EMA. We expect this property to be implemented by the child class.

update_ema (abstract)

The method to update the EMA model. We expect this method to be implemented by the child class.

loss_unl_scaler (static)

Takes in the current progress of the training, 0.0 to 1.0, where 0.0 is the start of the training, and 1.0 is the end. Then, returns the multiplier for the unlabeled loss.
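For instance, a common choice is a linear ramp (a sketch; the actual scaler and its maximum weight are configurable):

```python
def linear_ramp(progress: float, max_weight: float = 100.0) -> float:
    # Linearly grow the unlabeled loss weight from 0 to max_weight.
    return progress * max_weight
```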

loss_lbl (static)

Implements the loss for labeled data. Takes in the predicted labels and the ground truth labels, and returns the loss. This is cross entropy for MixMatch.

loss_unl (static)

Implements the loss for unlabeled data. Takes in the predicted labels and the ground truth labels, and returns the loss. This is MSE for MixMatch.

mixup

Takes in the data and the labels, the beta distribution parameter, and returns the mixed data and labels.
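A sketch of the mix-up operation it implements (signature illustrative; MixMatch keeps the larger mixing coefficient so the result stays closer to the first argument):

```python
import numpy as np
import torch

def mixup(x: torch.Tensor, y: torch.Tensor, alpha: float):
    # y is assumed to be one-hot / soft labels.
    # lambda ~ Beta(alpha, alpha); keep the larger coefficient.
    lam = np.random.beta(alpha, alpha)
    lam = max(lam, 1 - lam)
    idx = torch.randperm(x.size(0))
    return lam * x + (1 - lam) * x[idx], lam * y + (1 - lam) * y[idx]
```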

sharpen

Takes in the labels and temperature, and returns the sharpened labels.
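For reference, the standard MixMatch sharpening operation (a sketch; the in-repo signature may differ):

```python
import torch

def sharpen(p: torch.Tensor, temp: float) -> torch.Tensor:
    # Raise class probabilities to 1/temp and renormalize; temp < 1 sharpens.
    p = p ** (1 / temp)
    return p / p.sum(dim=-1, keepdim=True)
```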

guess_labels

Takes in the unlabeled data, and returns the guessed labels.

progress

The current progress of the training, 0.0 to 1.0, where 0.0 is the start of the training, and 1.0 is the end.

training_step

The training step runs through 1 batch of data, and returns the loss. Note that this is significantly different from the validation step, as we handle the K-Augmented data differently.

test / validation_step

The test / validation step runs through 1 batch of data, and returns the loss.

predict_step

The predict step runs through 1 batch of data, and returns the actual decoded labels.

on_after_backward

The on_after_backward hook is called after the backward pass, and allows us to do custom operations. In our case, we use it to update the EMA model.

on_before_batch_transfer

The on_before_batch_transfer hook is called before the batch is transferred to the GPU. In our case, we use it to preprocess the batch.

A diagram of how these components interact with each other is shown below:

[Diagram: Batch → on_before_batch_transfer → training_step → guess_labels → sharpen → mix_up → loss_unl (scaled by loss_unl_scaler) + loss_lbl → loss → backward → on_after_backward → update_ema; validation_step → loss]

Finally, we show an example of how to use the MixMatch module:

from sklearn.preprocessing import StandardScaler, OrdinalEncoder from frdc.train.mixmatch_module import MixMatchModule @@ -60,7 +60,7 @@ sharpen_temp=0.5, mix_beta_alpha=0.75, ) -

In particular, we need to supply some transformations for the preprocessing step. In this case, we use StandardScaler to scale the data, and OrdinalEncoder to encode the labels.

  1. It's best if standardization is done only on the training data, and not the validation data to better fit real-world scenarios.

  2. We use OrdinalEncoder as it handles unseen labels. So if a class doesn't show up in the training data, it will be encoded as np.nan, and will not participate in the loss calculation.

Design Choices

Static Method Overriding

We implement many functions as static, as we believe that a functional style reduces dependencies, thus making the code easier to test and debug.

Furthermore, it allows the subclasses to easily override the functions, to customize the behavior of the MixMatch module.

For example, the loss_unl_scaler function is static; thus, we can implement our own scaling function and pass it to the MixMatch module.

+

In particular, we need to supply some transformations for the preprocessing step. In this case, we use StandardScaler to scale the data, and OrdinalEncoder to encode the labels.

  1. It's best if standardization is done only on the training data, and not the validation data to better fit real-world scenarios.

  2. We use OrdinalEncoder as it handles unseen labels. So if a class doesn't show up in the training data, it will be encoded as np.nan, and will not participate in the loss calculation.
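A minimal sketch of such an encoder configuration (standard scikit-learn API):

```python
import numpy as np
from sklearn.preprocessing import OrdinalEncoder

# Labels unseen during fit are encoded as np.nan instead of raising an error.
enc = OrdinalEncoder(handle_unknown="use_encoded_value", unknown_value=np.nan)
enc.fit([["maple"], ["oak"]])
print(enc.transform([["oak"], ["birch"]]))  # [[1.], [nan]]
```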

Design Choices

Static Method Overriding

We implement many functions as static, as we believe that a functional style reduces dependencies, thus making the code easier to test and debug.

Furthermore, it allows the subclasses to easily override the functions, to customize the behavior of the MixMatch module.

For example, the loss_unl_scaler function is static; thus, we can implement our own scaling function and pass it to the MixMatch module.

def my_loss_unl_scaler(progress: float) -> float: return progress ** 2 @@ -68,4 +68,4 @@ @staticmethod def loss_unl_scaler(progress: float) -> float: return my_loss_unl_scaler(progress) -

If we had used a method instead, we would have to consider instance state, which would make it harder to override.

Why not use Dataclasses?

One of the biggest caveats of nn.Module is that it requires super().__init__() to be called before anything is assigned. While dataclass can leverage __post_init__ to do the same, we felt that this was too much of a hassle to save a few keystrokes. Thus, we opted to use __init__ instead; while more verbose, it is more explicit.

Why use PyTorch Lightning?

While we did hit some road blocks implementing SSL, due to its complex and unconventional nature, we felt that the benefits of using PyTorch Lightning outweighed the cons.

on_before_batch_transfer and on_after_backward are unconventional hooks, and we had to do some digging to find them. It can be argued that by just writing explicit code, we can avoid the need for these hooks, but the PyTorch ecosystem fixes many other issues, so we closed an eye on this.

References

Last modified: 20 December 2023
\ No newline at end of file +

If we had used a method instead, we would have to consider instance state, which would make it harder to override.

Why not use Dataclasses?

One of the biggest caveats of nn.Module is that it requires super().__init__() to be called before anything is assigned. While dataclass can leverage __post_init__ to do the same, we felt that this was too much of a hassle to save a few keystrokes. Thus, we opted to use __init__ instead: while more verbose, it is more explicit.
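
A minimal example of the constraint described above:

```python
import torch.nn as nn


class Bad(nn.Module):
    def __init__(self):
        # Raises AttributeError: cannot assign module before
        # Module.__init__() call.
        self.fc = nn.Linear(1, 1)
        super().__init__()


class Good(nn.Module):
    def __init__(self):
        super().__init__()
        self.fc = nn.Linear(1, 1)
```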

Why use PyTorch Lightning?

We did hit some roadblocks implementing SSL due to its complex and unconventional nature, but we felt that the benefits of using PyTorch Lightning outweighed the cons.

on_before_batch_transfer and on_after_backward are unconventional hooks, and we had to do some digging to find them. It can be argued that by just writing explicit code we could avoid the need for these hooks, but the PyTorch Lightning ecosystem solves many other issues for us, so we turned a blind eye to this.

References

Last modified: 29 December 2023
diff --git a/docs/mix-match.html b/docs/mix-match.html

MixMatch | Documentation

Documentation 0.0.8 Help

MixMatch

In FRDC-ML, we leverage semi-supervised learning to improve the model's performance through better augmentation consistency and by making use of unlabelled data.

The algorithm we use is MixMatch, a state-of-the-art semi-supervised learning algorithm. It is based on the idea of consistency regularization, which encourages models to predict the same class even after augmentations that occur naturally in the real world.

Our implementation of MixMatch is a refactored version of YU1ut/MixMatch-pytorch. We've refactored the code to follow more modern PyTorch practices, allowing us to use it with modern PyTorch frameworks such as PyTorch Lightning.

We won't go through the details of MixMatch here; see Our Documentation in our MixMatch-PyTorch-CIFAR10 repository for more details.

Implementation Details

  1. How we implemented the MixMatch logic: MixMatchModule

  2. How we implemented the unique MixMatch data loading logic: Custom MixMatch Data Loading

References

Last modified: 29 December 2023
diff --git a/docs/model-test-chestnut-may-dec.html b/docs/model-test-chestnut-may-dec.html

Model Test Chestnut May-Dec | Documentation

Documentation 0.0.8 Help

Model Test Chestnut May-Dec

This test is used to evaluate the model performance on the Chestnut Nature Park May & December dataset.

See this script in model_tests/chestnut_dec_may/train.py.

Motivation

The usage of this model will be to classify trees in unseen datasets under different conditions. In this test, we'll evaluate it under a different season.

A caveat is that it'll be evaluated on the same set of trees, so it's not representative of a field test. However, given the difficulty of obtaining datasets, this still gives us a good preliminary idea of how the model will perform in different conditions.

Methodology

We train on the December dataset, and test on the May dataset.

[Diagram: DecDataset supplies both the Labelled Train and the Unlabelled Train data to the Model; MayDataset supplies the Test data.]

Despite not having any true unlabelled data, we use MixMatch by treating the labelled data of the December dataset as unlabelled data.
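
With the dataset presets introduced elsewhere in this change, that setup can be sketched as follows; treat this as an illustration rather than the exact train.py wiring:

```python
from frdc.load.preset import FRDCDatasetPreset

# The labelled December data, and the same December data with its
# labels masked away, standing in as the unlabelled training set.
train_lab_ds = FRDCDatasetPreset.chestnut_20201218()
train_unl_ds = FRDCDatasetPreset.chestnut_20201218.unlabelled()
```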

Model

The current model used is a simple InceptionV3 transfer learning model, with the last layer replaced by one or more fully connected layers.

[Diagram: Input → InceptionV3 (frozen) → FC Layer(s) → Softmax → Output, trained against the SSL loss.]

Preprocessing

For Training: Segment → RandomCrop 299 → Horizontal Flip 50% → Vertical Flip 50% → Normalize By Training Mean & Std (a torchvision sketch of this chain follows below)

For Validation: Segment → CenterCrop 299 → Normalize By Training Mean & Std

For Evaluation: Segment → CenterCrop 299 → Normalize By Training Mean & Std, then evaluated As Is, with Horizontal Flip, with Vertical Flip, and with Horizontal & Vertical Flip
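
As a sketch, the training chain above maps naturally onto torchvision's v2 transforms (which this project already uses elsewhere); the band statistics below are placeholders for the actual training mean and standard deviation:

```python
from torchvision.transforms import v2

# Placeholder statistics; the real pipeline computes these per band
# from the training set.
train_mean = [0.5] * 8
train_std = [0.25] * 8

train_tf = v2.Compose([
    v2.RandomCrop(299, pad_if_needed=True),
    v2.RandomHorizontalFlip(p=0.5),
    v2.RandomVerticalFlip(p=0.5),
    v2.Normalize(mean=train_mean, std=train_std),
])
```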

For evaluation, we check that the model is invariant to horizontal and vertical flips of the original image.

Hyperparameters

The following hyperparameters are used:

  • Optimizer: Adam

  • Learning Rate: 1e-3

  • Batch Size: 32

  • Epochs: 10

  • Train Iterations: 25~100

  • Validation Iterations: 10~25

  • Early Stopping: 4
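
One way these hyperparameters could be wired into a PyTorch Lightning Trainer, as a hedged sketch; the monitored metric name and the stand-in model are assumptions, and the actual train.py may differ:

```python
import torch
from lightning import Trainer
from lightning.pytorch.callbacks import EarlyStopping

model = torch.nn.Linear(1, 1)  # stand-in for the actual module

optim = torch.optim.Adam(model.parameters(), lr=1e-3)
trainer = Trainer(
    max_epochs=10,
    limit_train_batches=100,  # 25~100 train iterations
    limit_val_batches=25,     # 10~25 validation iterations
    callbacks=[EarlyStopping(monitor="val_loss", patience=4)],
)
```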

Results

We evaluate around 40% accuracy on the test set, compared to 100% on the training set. This indicates that the model has saturated and cannot learn any more from the training set. There's no indication of overfitting, as the validation loss merely plateaus.

W&B Dashboard

Caveats

  • The test set is very small, so the results are not very representative.

  • The test set is the same set of trees, so it's not a true test of the model performance in different conditions.

  • There are many classes with 1 sample, so the model may not be able to learn the features of these classes well.

Last modified: 29 December 2023
diff --git a/docs/overview.html b/docs/overview.html

Overview | Documentation

Documentation 0.0.8 Help

Overview

Forest Recovery Digital Companion (FRDC) is an ML-assisted companion for ecologists to automatically classify surveyed trees via an Unmanned Aerial Vehicle (UAV).

This package, FRDC-ML, is the Machine Learning backbone of this project: a centralized repository of tools and model architectures to be used in the FRDC pipeline.

Get started here

Other Projects

FRDC-UI

The User Interface Repository for FRDC, a WebApp GUI for ecologists to adjust annotations.

Last modified: 29 December 2023
diff --git a/docs/preprocessing-extract-segments.html b/docs/preprocessing-extract-segments.html

preprocessing.extract_segments | Documentation

Documentation 0.0.8 Help

preprocessing.extract_segments

Functions

extract_segments_from_labels

Extracts segments from a label classification.

extract_segments_from_bounds

Extracts segments from Rect bounds.

remove_small_segments_from_labels

Removes small segments from a label classification.

Extract with Boundaries

A boundary is a Rect object that represents the minimum bounding box of a segment, with x0, y0, x1, y1 coordinates.

It simply slices the original image to the bounding box. The origin is the top left corner of the image.

[Diagram: a 3×3 Original Image (cells 1 to 9) extracted by the bounds (x0, y0, x1, y1); when cropped, the Segmented Image keeps only the in-bounds cells (e.g. 8, 9), and when uncropped it stays the original size with out-of-bounds cells zeroed (e.g. 0, 8, 9).]
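
The slicing itself is plain NumPy indexing. A minimal illustration with a toy array standing in for the image; the bounds values are made up:

```python
import numpy as np

ar = np.arange(1, 10).reshape(3, 3)  # a 3x3 "image" of cells 1..9
x0, y0, x1, y1 = 1, 0, 3, 2          # illustrative Rect bounds

# Origin at the top-left corner: rows index y, columns index x.
segment = ar[y0:y1, x0:x1]
print(segment)  # [[2 3]
                #  [5 6]]
```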

Extract with Labels

A label classification is a np.ndarray where each pixel is mapped to a segment. The segments are mapped to a unique integer. In our project, the 0th label is the background.

For example, a label classification of 3 segments will look like this:

[Diagram: a 3×3 Label Classification shown next to the 3×3 Original Image; each cell holds a segment label (e.g. a bottom row of 1, 1, 0 against image cells 7, 8, 9), with 0 as the background.]

The extraction will take the minimum bounding box of each segment and return a list of segments.

For example, the label 1 and 2 extracted images will be

[Diagram: Extracted Segment 1 and Extracted Segment 2, shown cropped to their minimum bounding boxes (e.g. a row of 7, 8) and, alternatively, kept at the original image size with all other cells zeroed.]
  • If cropped is False, the segments are padded with 0s to the original image size. While this can ensure shape consistency, it can consume more memory for large images.

  • If cropped is True, the segments are cropped to the minimum bounding box. This can save memory, but the shape of the segments will be inconsistent.

Usage

Extract from Bounds and Labels

Extract segments from bounds and labels.

import numpy as np

from frdc.load.preset import FRDCDatasetPreset
from frdc.preprocess.extract_segments import extract_segments_from_bounds

ds = FRDCDatasetPreset.chestnut_20201218()
ar, order = ds.get_ar_bands()
bounds, labels = ds.get_bounds_and_labels()

segments: list[np.ndarray] = extract_segments_from_bounds(ar, bounds)

Extract from Auto-Segmentation

Extract segments from a label classification.

from skimage.morphology import remove_small_objects, remove_small_holes
import numpy as np

from frdc.load.preset import FRDCDatasetPreset
from frdc.preprocess.morphology import (
    threshold_binary_mask, binary_watershed
)
from frdc.preprocess.scale import scale_0_1_per_band
from frdc.preprocess.extract_segments import (
    extract_segments_from_labels, remove_small_segments_from_labels
)

ds = FRDCDatasetPreset.chestnut_20201218()
ar, order = ds.get_ar_bands()
ar = scale_0_1_per_band(ar)
ar_mask = threshold_binary_mask(ar, -1, 90 / 256)
# The mask clean-up steps here are hidden by the diff context; shown
# with illustrative parameters.
ar_mask = remove_small_objects(ar_mask, min_size=100, connectivity=2)
ar_mask = remove_small_holes(ar_mask, area_threshold=100, connectivity=2)
ar_labels = binary_watershed(ar_mask)
ar_labels = remove_small_segments_from_labels(
    ar_labels, min_height=10, min_width=10
)

segments: list[np.ndarray] = extract_segments_from_labels(ar, ar_labels)

API

extract_segments_from_labels(ar, ar_labels, cropped)

Extracts segments from a label classification.


ar_labels is a label classification as a np.ndarray

extract_segments_from_bounds(ar, bounds, cropped)

Extracts segments from Rect bounds.


bounds is a list of Rect bounds.

remove_small_segments_from_labels(ar_labels, min_height, min_width)

Removes small segments from a label classification.


Last modified: 29 December 2023
diff --git a/docs/preprocessing-glcm-padded.html b/docs/preprocessing-glcm-padded.html

preprocessing.glcm_padded | Documentation

Documentation 0.0.8 Help

preprocessing.glcm_padded

Functions

glcm_padded

Computes the GLCM of the NDArray bands with padding.

glcm_padded_cached

Computes the GLCM of the NDArray bands with padding, and caches it.

append_glcm_padded_cached

Computes the GLCM of the NDArray bands with padding, caches it, and appends it onto the original array.

Usage

We show a few examples of how to use the GLCM functions.

import numpy as np
from glcm_cupy import Features

# Import path assumed from this page's module name; most of the
# original listing is hidden by the diff context, only the last call
# is visible, so the earlier calls are reconstructed from the bullet
# points below.
from frdc.preprocess.glcm_padded import (
    glcm_padded,
    glcm_padded_cached,
    append_glcm_padded_cached,
)

ar = ...  # the input (H, W, C) array, elided in the diff

ar_glcm = glcm_padded(ar, bin_from=1, bin_to=4, radius=3)
ar_glcm_2_features = glcm_padded(
    ar, bin_from=1, bin_to=4, radius=3,
    features=(Features.CONTRAST, Features.CORRELATION),
)
ar_glcm_cached = glcm_padded_cached(ar, bin_from=1, bin_to=4, radius=3)
ar_glcm_cached_appended = append_glcm_padded_cached(
    ar, bin_from=1, bin_to=4, radius=3
)
  • ar_glcm is the GLCM of the original array, with the last dimension being the GLCM features. The number of features is determined by the features parameter, which defaults to all features.

  • ar_glcm_2_features selects only 2 features, with the last dimension being the 2 GLCM features specified.

  • ar_glcm_cached caches the GLCM so that if you call it again, it will return the cached version. It stores its data at the project root dir, under .cache/.

  • ar_glcm_cached_appended is a wrapper around ar_glcm_cached, it appends the GLCM features onto the original array. It's equivalent to calling ar_glcm_cached and then np.concatenate on the final axes.

Caching

GLCM is an expensive operation, thus we recommend caching it if the input parameters will be the same. This is especially useful if you're experimenting on the same dataset with constant parameters.

API

glcm_padded(ar, bin_from, bin_to, radius, step_size, features)

Computes the GLCM of the NDArray bands with padding.


  • ar is the input array

  • bin_from is the upper bound of the input

  • bin_to is the upper bound of the GLCM input, i.e. the resolution that GLCM operates on

  • radius is the radius of the GLCM

  • step_size is the step size of the GLCM

  • features is the list of GLCM features to compute

The return shape is (H, W, C, F), where F is the number of GLCM features computed; the padded GLCM preserves the input's height and width.

See glcm_cupy for the GLCM Features.

glcm_padded_cached(ar, bin_from, bin_to, radius, step_size, features)

Computes the GLCM of the NDArray bands with padding, and caches it.


See glcm_padded for the parameters and output shape

append_glcm_padded_cached(ar, bin_from, bin_to, radius, step_size, features)

Computes the GLCM of the NDArray bands with padding, caches it, and appends it onto the original array.


See glcm_padded for the parameters


The return shape is (H, W, C + C × F).

The function automatically flattens the last 2 dimensions of the GLCM features, and appends it onto the original array.
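
The shape bookkeeping, following the description above; the sizes are illustrative:

```python
import numpy as np

H, W, C, F = 128, 128, 8, 7  # illustrative sizes

ar = np.zeros((H, W, C))          # original array
ar_glcm = np.zeros((H, W, C, F))  # its padded GLCM features

# Flatten the last 2 dimensions (C, F) and append onto the channels.
appended = np.concatenate([ar, ar_glcm.reshape(H, W, C * F)], axis=-1)
print(appended.shape)  # (128, 128, 64), i.e. (H, W, C + C * F)
```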

Last modified: 29 December 2023
diff --git a/docs/preprocessing-morphology.html b/docs/preprocessing-morphology.html

preprocessing.morphology | Documentation

Documentation 0.0.8 Help

preprocessing.morphology

Functions

threshold_binary_mask

Thresholds a selected NDArray band to yield a binary mask.

binary_watershed

Performs watershed on a binary mask to yield a mapped label classification.

Usage

Perform auto-segmentation on a dataset to yield a label classification.

from frdc.load.preset import FRDCDatasetPreset
from frdc.preprocess.morphology import (
    threshold_binary_mask, binary_watershed
)

ds = FRDCDatasetPreset.chestnut_20201218()
ar, order = ds.get_ar_bands()
mask = threshold_binary_mask(ar, order.index('NIR'), 90 / 256)
ar_label = binary_watershed(mask)

API

threshold_binary_mask(ar, band_idx, threshold_value)

Thresholds a selected NDArray band to yield a binary mask as np.ndarray.


This is equivalent to

ar[..., band_idx] > threshold_value
binary_watershed(ar_mask, peaks_footprint, watershed_compactness)

Performs watershed on a binary mask to yield a mapped label classification as a np.ndarray.


  • peaks_footprint is the footprint of skimage.feature.peak_local_max

  • watershed_compactness is the compactness of skimage.morphology.watershed
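
A hedged sketch of calling it with these parameters made explicit; the footprint array, its expected type, and the compactness value are illustrative assumptions, not the library's documented defaults:

```python
import numpy as np

from frdc.preprocess.morphology import binary_watershed

ar_mask = np.zeros((64, 64), dtype=bool)  # toy binary mask
ar_mask[8:24, 8:24] = True

ar_label = binary_watershed(
    ar_mask,
    peaks_footprint=np.ones((10, 10)),  # illustrative footprint
    watershed_compactness=0.1,          # illustrative compactness
)
```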

Last modified: 29 December 2023
diff --git a/docs/preprocessing-scale.html b/docs/preprocessing-scale.html

preprocessing.scale | Documentation

Documentation 0.0.8 Help

preprocessing.scale

Functions

scale_0_1_per_band

Scales the NDArray bands to [0, 1] per band.

scale_normal_per_band

Scales the NDArray bands to zero mean unit variance per band.

scale_static_per_band

Scales the NDArray bands by a predefined configuration. Take a look at frdc.conf.BAND_MAX_CONFIG for an example.

Usage

from frdc.load.preset import FRDCDatasetPreset
from frdc.preprocess.scale import (
    scale_0_1_per_band,
    scale_normal_per_band,
    scale_static_per_band,
)
from frdc.conf import BAND_MAX_CONFIG

ds = FRDCDatasetPreset.chestnut_20201218()
ar, order = ds.get_ar_bands()
ar_01 = scale_0_1_per_band(ar)
ar_norm = scale_normal_per_band(ar)
ar_static = scale_static_per_band(ar, order, BAND_MAX_CONFIG)
Last modified: 29 December 2023
diff --git a/docs/retrieve-our-datasets.html b/docs/retrieve-our-datasets.html

Retrieve our Datasets | Documentation

Documentation 0.0.8 Help

Retrieve our Datasets

In this tutorial, we'll learn how to:

  • Retrieve FRDC's Hyperspectral Image Data as np.ndarray

  • Retrieve FRDC's Ground Truth bounds and labels

  • Slice/segment the image data by the bounds

Prerequisites

  • New here? Get Started.

  • Set up the Google Cloud Authorization to download the data.

Retrieve the Data

To retrieve the data, use FRDCDataset.

Here, we'll download and load our

  • ar: Hyperspectral Image Data

  • order: The order of the bands

  • bounds: The bounds of the trees (segments)

  • labels: The labels of the trees (segments)

from frdc.load.preset import FRDCDatasetPreset

ds = FRDCDatasetPreset.chestnut_20201218()
ar, order = ds.get_ar_bands()
bounds, labels = ds.get_bounds_and_labels()

What Datasets are there?

from frdc.load.gcs import list_gcs_datasets

print(list_gcs_datasets())
# 0    DEBUG/0
# ...  (entry 1 is hidden by the diff context)
# 2    casuarina/20220418/93deg
# 3    chestnut_nature_park/20201218
# ...
  • The first part of the path is the site, and the second part is the date.

  • The version is the rest of the path; if there isn't any, use None.

For example, a path of ds/date/ver gives site="ds", date="date", version="ver"; a path of ds/date/ver/01/data gives site="ds", date="date", version="ver/01/data"; and a path of ds/date gives site="ds", date="date", version=None.
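
Putting those rules together: a dataset at chestnut_nature_park/20201218 (which has no version) can also be loaded through the raw constructor, which is what the presets wrap:

```python
from frdc.load.dataset import FRDCDataset

ds = FRDCDataset(
    site="chestnut_nature_park",
    date="20201218",
    version=None,
)
```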

Segment the Data

To segment the data, use Extract Segments.

Here, we'll segment the data by the bounds.

from frdc.load.preset import FRDCDatasetPreset
from frdc.preprocess.extract_segments import extract_segments_from_bounds

ds = FRDCDatasetPreset.chestnut_20201218()
ar, order = ds.get_ar_bands()
bounds, labels = ds.get_bounds_and_labels()
segments = extract_segments_from_bounds(ar, bounds)

segments is a list of np.ndarray of shape H, W, C, representing a tree. The order of segments is the same as labels, so you can use labels to identify the tree.

Plot the Data (Optional)

We can then use these data to plot out the first tree segment.

import matplotlib.pyplot as plt

from frdc.load.preset import FRDCDatasetPreset
from frdc.preprocess.extract_segments import extract_segments_from_bounds
from frdc.preprocess.scale import scale_0_1_per_band

ds = FRDCDatasetPreset.chestnut_20201218()
ar, order = ds.get_ar_bands()
bounds, labels = ds.get_bounds_and_labels()
segments = extract_segments_from_bounds(ar, bounds)

# The lines hidden by the diff context reorder the first segment's
# bands from BGR to RGB and scale it to [0, 1] per band; this is an
# illustrative reconstruction of those steps.
segment_0_rgb = segments[0][
    ..., [order.index("Red"), order.index("Green"), order.index("Blue")]
]
segment_0_rgb_scaled = scale_0_1_per_band(segment_0_rgb)

plt.imshow(segment_0_rgb_scaled)
plt.title(f"Tree {labels[0]}")
plt.show()

See also: preprocessing.scale.scale_0_1_per_band

Matplotlib cannot show the data correctly as-is, so we need to:

  • Convert the data from BGR to RGB

  • Scale the data to 0-1 per band

Last modified: 29 December 2023
diff --git a/docs/train-frdc-lightning.html b/docs/train-frdc-lightning.html

train.frdc_datamodule & frdc_module | Documentation

Documentation 0.0.8 Help

train.frdc_datamodule & frdc_module

These are FRDC-specific LightningDataModule and LightningModule classes, core components in the PyTorch Lightning ecosystem that provide a simple interface to train and evaluate models.

Classes

FRDCDataModule

The FRDC PyTorch Lightning DataModule.

FRDCModule

The FRDC PyTorch Lightning Module.

Usage

API

FRDCDataModule(segments, labels, preprocess, augmentation, train_val_test_split, batch_size)

Initializes the FRDC PyTorch Lightning DataModule.


  • segments, labels are retrieved from our datasets (see Retrieve our Datasets)

  • preprocess is a function that takes in a segment and returns a preprocessed segment. In particular, it should accept a list of NumPy NDArrays and return a single stacked PyTorch Tensor.

  • augmentation is a function that takes in a segment and returns an augmented segment. In particular, it takes in a PyTorch Tensor and returns another.

  • train_val_test_split is a function that takes a TensorDataset and returns a list of 3 TensorDatasets, for train, val and test respectively.

  • batch_size is the batch size.
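
A hedged sketch of wiring these arguments up, following the argument list documented above; the preprocess and augmentation stand-ins are illustrative (a real preprocess would also resize each segment to a common shape before stacking), and segments / labels come from the Retrieve our Datasets tutorial:

```python
import torch
from torch.utils.data import random_split

from frdc.train.frdc_datamodule import FRDCDataModule


def preprocess(segments):
    # list[np.ndarray] -> one stacked Tensor (resizing omitted here).
    return torch.stack([torch.as_tensor(s).float() for s in segments])


def augmentation(x):
    # Tensor -> Tensor; identity stand-in.
    return x


dm = FRDCDataModule(
    segments=segments,  # from Retrieve our Datasets
    labels=labels,
    preprocess=preprocess,
    augmentation=augmentation,
    train_val_test_split=lambda ds: random_split(ds, [0.6, 0.2, 0.2]),
    batch_size=32,
)
```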

FRDCModule(model_cls, model_kwargs, optim_cls, optim_kwargs)

Initializes the FRDC PyTorch Lightning Module.


  • model_cls is the Class of the model.

  • model_kwargs is the kwargs to pass to the model.

  • optim_cls is the Class of the optimizer.

  • optim_kwargs is the kwargs to pass to the optimizer.

Internally, the module will initialize the model and optimizer as follows:

model = model_cls(**model_kwargs)
optim = optim_cls(model.parameters(), **optim_kwargs)
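
For instance, assuming the module lives at frdc.train.frdc_module, construction might look like this; the model class and the kwargs are hypothetical:

```python
import torch

from frdc.train.frdc_module import FRDCModule


class MyModel(torch.nn.Module):
    def __init__(self, n_classes: int):
        super().__init__()
        self.fc = torch.nn.LazyLinear(n_classes)

    def forward(self, x):
        return self.fc(x)


module = FRDCModule(
    model_cls=MyModel,
    model_kwargs=dict(n_classes=10),
    optim_cls=torch.optim.Adam,
    optim_kwargs=dict(lr=1e-3),
)
```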
Last modified: 29 December 2023
diff --git a/rsc.dvc b/rsc.dvc
deleted file mode 100644
index f9ae0e31..00000000

[rsc.dvc: a 424-line machine-generated DVC manifest (md5/etag/version_id entries for the DEBUG, casuarina and chestnut_nature_park rasters and point clouds), deleted in this change.]

diff --git a/src/.gitignore b/src/.gitignore
index 57b22671..d3514034 100644
--- a/src/.gitignore
+++ b/src/.gitignore
@@ -1,2 +1,3 @@
 label-studio/
 !label-studio/docker-compose.yml
+!label-studio/dump.sh

diff --git a/src/frdc/conf.py b/src/frdc/conf.py
index 89986988..0d32eb45 100644
--- a/src/frdc/conf.py
+++ b/src/frdc/conf.py
@@ -56,9 +56,12 @@
 except Exception as e:
     logger.warning(
         "Could not connect to GCS. Will not be able to download files. "
+        "Check that you've (1) Installed the GCS CLI and (2) Set up the"
+        "ADC with `gcloud auth application-default login`. "
         "GCS_CLIENT will be None."
     )
     GCS_CLIENT = None
+    GCS_BUCKET = None

 try:
     logger.info("Connecting to Label Studio...")
@@ -68,6 +71,17 @@
         api_key=LABEL_STUDIO_API_KEY,
     )
     logger.info("Connected to Label Studio.")
+    try:
+        logger.info("Attempting to Get Label Studio Project...")
+        LABEL_STUDIO_CLIENT.get_project(1)
+    except requests.exceptions.HTTPError:
+        logger.warning(
+            f"Could not get main annotation project. "
+            f"Pulling annotations may not work. "
+            f"It's possible that your API Key is incorrect, "
+            f"or somehow your .netrc is preventing you from "
+            f"accessing the project. "
+        )
 except requests.exceptions.ConnectionError:
     logger.warning(
         f"Could not connect to Label Studio at {LABEL_STUDIO_URL}. 
" diff --git a/src/frdc/evaluate/__init__.py b/src/frdc/evaluate/__init__.py index 48354a4b..8b137891 100644 --- a/src/frdc/evaluate/__init__.py +++ b/src/frdc/evaluate/__init__.py @@ -1,3 +1 @@ -from .evaluate import dummy_evaluate -__all__ = ["dummy_evaluate"] diff --git a/src/frdc/evaluate/evaluate.py b/src/frdc/evaluate/evaluate.py deleted file mode 100644 index a0ccfbed..00000000 --- a/src/frdc/evaluate/evaluate.py +++ /dev/null @@ -1,31 +0,0 @@ -from typing import Callable - -import numpy as np -from sklearn.base import ClassifierMixin - - -def dummy_evaluate( - *, - feature_extraction: Callable[[np.ndarray], np.ndarray], - classifier: ClassifierMixin, - X_test: np.ndarray, - y_test: np.ndarray, -) -> float: - """Dummy Evaluation function. - - Notes: - This is obviously not final. This is just a placeholder to get the - pipeline working. - - Args: - feature_extraction: The feature extraction function. - classifier: The classifier. - X_test: X_test is the test image numpy array of shape (N, H, W, C). - y_test: y_test is the test class label a numpy array of shape (N,). - - Returns: - The score of the model. - """ - # TODO: Replace this with how the model scores - - return classifier.score(feature_extraction(X_test), y_test) diff --git a/src/frdc/load/__init__.py b/src/frdc/load/__init__.py index 06860a70..e69de29b 100644 --- a/src/frdc/load/__init__.py +++ b/src/frdc/load/__init__.py @@ -1,3 +0,0 @@ -from .dataset import FRDCDataset - -__all__ = ["FRDCDataset"] diff --git a/src/frdc/load/dataset.py b/src/frdc/load/dataset.py index b3654cca..466aad93 100644 --- a/src/frdc/load/dataset.py +++ b/src/frdc/load/dataset.py @@ -8,7 +8,6 @@ import numpy as np import pandas as pd -import torch from PIL import Image from torch.utils.data import Dataset, ConcatDataset @@ -27,6 +26,44 @@ logger = logging.getLogger(__name__) +class FRDCConcatDataset(ConcatDataset): + """ConcatDataset for FRDCDataset. + + Notes: + This handles concatenating the targets when you add two datasets + together, furthermore, implements the addition operator to + simplify the syntax. + + Examples: + If you have two datasets, ds1 and ds2, you can concatenate them:: + + ds = ds1 + ds2 + + `ds` will be a FRDCConcatDataset, which is a subclass of ConcatDataset. + + You can further add to a concatenated dataset:: + + ds = ds1 + ds2 + ds = ds + ds3 + + Finallu, all concatenated datasets have the `targets` property, which + is a list of all the targets in the datasets:: + + (ds1 + ds2).targets == ds1.targets + ds2.targets + """ + + def __init__(self, datasets: list[FRDCDataset]): + super().__init__(datasets) + self.datasets: list[FRDCDataset] = datasets + + @property + def targets(self): + return [t for ds in self.datasets for t in ds.targets] + + def __add__(self, other: FRDCDataset) -> FRDCConcatDataset: + return FRDCConcatDataset([*self.datasets, other]) + + @dataclass class FRDCDataset(Dataset): def __init__( @@ -40,6 +77,17 @@ def __init__( ): """Initializes the FRDC Dataset. + Notes: + We recommend to check FRDCDatasetPreset if you want to use a + pre-defined dataset. + + You can concatenate datasets using the addition operator, e.g.:: + + ds = FRDCDataset(...) + FRDCDataset(...) + + This will return a FRDCConcatDataset, see FRDCConcatDataset for + more information. + Args: site: The site of the dataset, e.g. "chestnut_nature_park". date: The date of the dataset, e.g. "20201218". @@ -47,19 +95,18 @@ def __init__( transform: The transform to apply to each segment. target_transform: The transform to apply to each label. 
use_legacy_bounds: Whether to use the legacy bounds.csv file. + This will automatically be set to True if LABEL_STUDIO_CLIENT + is None, which happens when Label Studio cannot be connected + to. """ self.site = site self.date = date self.version = version self.ar, self.order = self.get_ar_bands() + self.targets = None if use_legacy_bounds or (LABEL_STUDIO_CLIENT is None): - logger.warning( - "Using legacy bounds.csv file for dataset." - "This is pending to be deprecated in favour of pulling " - "annotations from Label Studio." - ) bounds, self.targets = self.get_bounds_and_labels() self.ar_segments = extract_segments_from_bounds(self.ar, bounds) else: @@ -83,37 +130,9 @@ def __getitem__(self, idx): else self.targets[idx], ) - @staticmethod - def _load_debug_dataset(resize: int = 299) -> FRDCDataset: - """Loads a debug dataset from Google Cloud Storage. - - Returns: - A dictionary of the dataset, with keys as the filenames and values - as the images. - """ - from torchvision.transforms.v2 import ( - Compose, - ToImage, - ToDtype, - Resize, - ) - - return FRDCDataset( - site="DEBUG", - date="0", - version=None, - transform=Compose( - [ - ToImage(), - ToDtype(torch.float32), - Resize((resize, resize)), - ] - ), - target_transform=None, - ) - @property def dataset_dir(self): + """Returns the path format of the dataset.""" return Path( f"{self.site}/{self.date}/" f"{self.version + '/' if self.version else ''}" @@ -215,6 +234,11 @@ def get_bounds_and_labels( A tuple of (bounds, labels), where bounds is a list of (x0, y0, x1, y1) and labels is a list of labels. """ + logger.warning( + "Using legacy bounds.csv file for dataset." + "This is pending to be deprecated in favour of pulling " + "annotations from Label Studio." + ) fp = download(fp=self.dataset_dir / file_name) df = pd.read_csv(fp) return ( @@ -223,6 +247,7 @@ def get_bounds_and_labels( ) def get_polybounds_and_labels(self): + """Gets the bounds and labels from Label Studio.""" return get_task( Path(f"{self.dataset_dir}/result.jpg") ).get_bounds_and_labels() @@ -246,33 +271,29 @@ def _load_image(path: Path | str) -> np.ndarray: ar = np.asarray(im) return np.expand_dims(ar, axis=-1) if ar.ndim == 2 else ar + def __add__(self, other) -> FRDCConcatDataset: + return FRDCConcatDataset([self, other]) + -# TODO: Kind of hacky, the unlabelled dataset should somehow come from the -# labelled dataset by filtering out the unknown labels. But we'll -# figure out this later when we do get unlabelled data. -# I'm thinking some API that's like -# FRDCDataset.filter_labels(...) -> FRDCSubset, FRDCSubset -# It could be more intuitive if it returns FRDCDataset, so we don't have -# to implement another class. class FRDCUnlabelledDataset(FRDCDataset): + """An implementation of FRDCDataset that masks away the labels. + + Notes: + If you already have a FRDCDataset, you can simply set __class__ to + FRDCUnlabelledDataset to achieve the same behaviour:: + + ds.__class__ = FRDCUnlabelledDataset + + This will replace the __getitem__ method with the one below. + + However, it's also perfectly fine to initialize this directly:: + + ds_unl = FRDCUnlabelledDataset(...) + """ + def __getitem__(self, item): return ( self.transform(self.ar_segments[item]) if self.transform else self.ar_segments[item] ) - - -# This is not yet used much as we don't have sufficient training data. 
-class FRDCConcatDataset(ConcatDataset): - def __init__(self, datasets: list[FRDCDataset]): - super().__init__(datasets) - self.datasets = datasets - - def __getitem__(self, idx): - x, y = super().__getitem__(idx) - return x, y - - @property - def targets(self): - return [t for ds in self.datasets for t in ds.targets] diff --git a/src/frdc/load/label_studio.py b/src/frdc/load/label_studio.py index b8287ff3..6383cfe4 100644 --- a/src/frdc/load/label_studio.py +++ b/src/frdc/load/label_studio.py @@ -8,16 +8,6 @@ from frdc.conf import LABEL_STUDIO_CLIENT -# try: -# client.check_connection() -# except ConnectionError: -# raise ConnectionError( -# f"Could not connect to Label Studio at {LABEL_STUDIO_URL}. " -# "This uses Label Studio's check_connection() method," -# "which performs retries. " -# "Use utils.is_label_studio_up() as a faster alternative to check if " -# "Label Studio is up." -# ) logger = logging.getLogger(__name__) diff --git a/src/frdc/load/preset.py b/src/frdc/load/preset.py new file mode 100644 index 00000000..4f892349 --- /dev/null +++ b/src/frdc/load/preset.py @@ -0,0 +1,159 @@ +from __future__ import annotations + +import logging +from dataclasses import dataclass +from typing import Callable, Any + +import numpy as np +import torch +from torchvision.transforms.v2 import ( + Compose, + ToImage, + ToDtype, + Resize, +) + +from frdc.load.dataset import FRDCDataset, FRDCUnlabelledDataset + +logger = logging.getLogger(__name__) + + +# This curries the FRDCDataset class, so that we can shorthand the preset +# definitions. +@dataclass +class FRDCDatasetPartial: + """Partial class for FRDCDataset. + + Notes: + This is used internally by FRDCDatasetPreset to define the presets + in a more concise manner:: + + # Instead of + lambda *args, **kwargs: + FRDCDataset("chestnut_nature_park", "20201218", None, + *args, **kwargs) + + # Using partial, we can do this instead + FRDCDatasetPartial("chestnut_nature_park", "20201218", None)( + *args, **kwargs + ) + + See FRDCDatasetPreset for usage. + """ + + site: str + date: str + version: str | None + + def __call__( + self, + transform: Callable[[list[np.ndarray]], Any] = None, + target_transform: Callable[[list[str]], list[str]] = None, + use_legacy_bounds: bool = False, + ): + """Alias for labelled().""" + return self.labelled( + transform, + target_transform, + use_legacy_bounds, + ) + + def labelled( + self, + transform: Callable[[list[np.ndarray]], Any] = None, + target_transform: Callable[[list[str]], list[str]] = None, + use_legacy_bounds: bool = False, + ): + """Returns the Labelled Dataset.""" + return FRDCDataset( + self.site, + self.date, + self.version, + transform, + target_transform, + use_legacy_bounds, + ) + + def unlabelled( + self, + transform: Callable[[list[np.ndarray]], Any] = None, + target_transform: Callable[[list[str]], list[str]] = None, + use_legacy_bounds: bool = False, + ): + """Returns the Unlabelled Dataset. + + Notes: + This simply masks away the labels during __getitem__. + The same behaviour can be achieved by setting __class__ to + FRDCUnlabelledDataset, but this is a more convenient way to do so. + """ + return FRDCUnlabelledDataset( + self.site, + self.date, + self.version, + transform, + target_transform, + use_legacy_bounds, + ) + + +@dataclass +class FRDCDatasetPreset: + """Presets for the FRDCDataset. + + Examples: + Each variable is a preset for the FRDCDataset. + + You can use it like this:: + + FRDCDatasetPreset.chestnut_20201218() + + Which returns a FRDCDataset. 
+ + Furthermore, if you're interested in the unlabelled dataset, you can + use:: + + FRDCDatasetPreset.chestnut_20201218.unlabelled() + + Which returns a FRDCUnlabelledDataset. + + If you'd like to keep the syntax consistent for labelled and unlabelled + datasets, you can use:: + + FRDCDatasetPreset.chestnut_20201218.labelled() + FRDCDatasetPreset.chestnut_20201218.unlabelled() + + The `__call__` method is simply an alias for the `labelled` method. + + The DEBUG dataset is a special dataset that is used for debugging, + which pulls a small cropped image and dummy label bounds + from GCS. + + """ + + chestnut_20201218 = FRDCDatasetPartial( + "chestnut_nature_park", "20201218", None + ) + chestnut_20210510_43m = FRDCDatasetPartial( + "chestnut_nature_park", "20210510", "90deg43m85pct255deg" + ) + chestnut_20210510_60m = FRDCDatasetPartial( + "chestnut_nature_park", "20210510", "90deg60m84.5pct255deg" + ) + casuarina_20220418_183deg = FRDCDatasetPartial( + "casuarina_nature_park", "20220418", "183deg" + ) + casuarina_20220418_93deg = FRDCDatasetPartial( + "casuarina_nature_park", "20220418", "93deg" + ) + DEBUG = lambda resize=299: FRDCDatasetPartial( + site="DEBUG", date="0", version=None + )( + transform=Compose( + [ + ToImage(), + ToDtype(torch.float32), + Resize((resize, resize)), + ] + ), + target_transform=None, + ) diff --git a/src/frdc/train/frdc_datamodule.py b/src/frdc/train/frdc_datamodule.py index 6138c7e5..5e4e6dbd 100644 --- a/src/frdc/train/frdc_datamodule.py +++ b/src/frdc/train/frdc_datamodule.py @@ -1,11 +1,13 @@ from __future__ import annotations from dataclasses import dataclass +from typing import Literal from lightning import LightningDataModule -from torch.utils.data import DataLoader, RandomSampler +from torch.utils.data import DataLoader, RandomSampler, Sampler -from frdc.load import FRDCDataset +from frdc.load.dataset import FRDCDataset, FRDCUnlabelledDataset +from frdc.train.stratified_sampling import RandomStratifiedSampler @dataclass @@ -14,34 +16,39 @@ class FRDCDataModule(LightningDataModule): Notes: This is a special datamodule for semi-supervised learning, which - requires two dataloaders for the labelled and unlabelled datasets. - It can also be used for supervised learning, by passing in None for - the unlabelled dataset. + can accept an optional dataloader for an unlabelled dataset. + + Without an unlabelled dataset, it can be used for supervised learning + by passing in None for the unlabelled dataset. If you're using our MixMatch Module, using None for the unlabelled dataset will skip the MixMatch. However, note that this is not equivalent to passing the Labelled set as unlabelled as well. - For example: - >>> FRDCSSLDataModule( - ... train_lab_ds=train_lab_ds, - ... train_unl_ds=train_lab_ds, - ... ... - ... ) + For example:: + + FRDCDataModule( + train_lab_ds=train_lab_ds, + train_unl_ds=train_lab_ds, + ... + ) + + Does not have the same performance as:: - Does not have the same performance as: - >>> FRDCSSLDataModule( - ... train_lab_ds=train_lab_ds, - ... train_unl_ds=None, - ... ... - ... ) + FRDCDataModule( + train_lab_ds=train_lab_ds, + train_unl_ds=None, + ... + ) This is because some samples in MixMatch use the unlabelled loss. Args: train_lab_ds: The labelled training dataset. train_unl_ds: The unlabelled training dataset. Can be None, which will - default to a DataModule suitable for supervised learning.
If + train_unl_ds is a FRDCDataset, it will be converted to a + FRDCUnlabelledDataset, which simply masks away the labels. val_ds: The validation dataset. batch_size: The batch size to use for the dataloaders. train_iters: The number of iterations to run for the labelled training @@ -52,34 +59,43 @@ class FRDCDataModule(LightningDataModule): train_lab_ds: FRDCDataset val_ds: FRDCDataset - train_unl_ds: FRDCDataset | None = None + train_unl_ds: FRDCDataset | FRDCUnlabelledDataset | None = None batch_size: int = 4 train_iters: int = 100 val_iters: int = 100 + sampling_strategy: Literal["stratified", "random"] = "stratified" def __post_init__(self): super().__init__() + if isinstance(self.train_unl_ds, FRDCDataset): + self.train_unl_ds.__class__ = FRDCUnlabelledDataset + def train_dataloader(self): num_samples = self.batch_size * self.train_iters + if self.sampling_strategy == "stratified": + sampler = lambda ds: RandomStratifiedSampler( + ds.targets, num_samples=num_samples, replacement=True + ) + elif self.sampling_strategy == "random": + sampler = lambda ds: RandomSampler( + ds, num_samples=num_samples, replacement=True + ) + else: + raise ValueError( + f"Invalid sampling strategy: {self.sampling_strategy}" + ) + lab_dl = DataLoader( self.train_lab_ds, batch_size=self.batch_size, - sampler=RandomSampler( - self.train_lab_ds, - num_samples=num_samples, - replacement=False, - ), + sampler=sampler(self.train_lab_ds), ) unl_dl = ( DataLoader( self.train_unl_ds, batch_size=self.batch_size, - sampler=RandomSampler( - self.train_unl_ds, - num_samples=self.batch_size * self.train_iters, - replacement=False, - ), + sampler=sampler(self.train_unl_ds), ) if self.train_unl_ds is not None # This is a hacky way to create an empty dataloader. @@ -91,7 +107,6 @@ def train_dataloader(self): sampler=RandomSampler( empty, num_samples=num_samples, - replacement=False, ), ) ) diff --git a/src/frdc/train/mixmatch_module.py b/src/frdc/train/mixmatch_module.py index 194928ad..9e3af191 100644 --- a/src/frdc/train/mixmatch_module.py +++ b/src/frdc/train/mixmatch_module.py @@ -8,6 +8,7 @@ import torch.nn.functional as F import torch.nn.parallel import torch.nn.parallel +import wandb from lightning import LightningModule from sklearn.preprocessing import StandardScaler, OrdinalEncoder from torch.nn.functional import one_hot @@ -52,6 +53,7 @@ def __init__( self.sharpen_temp = sharpen_temp self.mix_beta_alpha = mix_beta_alpha self.save_hyperparameters() + self.lbl_logger = WandBLabelLogger() @property @abstractmethod @@ -150,10 +152,16 @@ def progress(self): ) / self.trainer.max_epochs def training_step(self, batch, batch_idx): - # Progress is a linear ramp from 0 to 1 over the course of training. (x_lbl, y_lbl), x_unls = batch + self.lbl_logger( + self.logger.experiment, + "Input Y Label", + y_lbl, + flush_every=10, + num_bins=self.n_classes, + ) - y_lbl = one_hot(y_lbl.long(), num_classes=self.n_classes) + y_lbl_ohe = one_hot(y_lbl.long(), num_classes=self.n_classes) # If x_unls is Truthy, then we are using MixMatch. # Otherwise, we are just using supervised learning. 
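In the hunk above, `one_hot` previously rebound `y_lbl` in place, so the integer labels were no longer available downstream; the rename to `y_lbl_ohe` keeps the raw integer labels for the new WandBLabelLogger calls while the one-hot copy feeds the losses. A minimal sketch of the intended split (tensor values are illustrative, not from the dataset):

    import torch
    from torch.nn.functional import one_hot

    y_lbl = torch.tensor([0, 2, 1])  # integer labels, kept for histogram logging
    y_lbl_ohe = one_hot(y_lbl.long(), num_classes=3)  # shape (3, 3)
    # y_lbl_ohe feeds the MixMatch losses; y_lbl stays integer-typed.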
@@ -164,7 +172,7 @@ def training_step(self, batch, batch_idx): y_unl = self.sharpen(y_unl, self.sharpen_temp) x = torch.cat([x_lbl, *x_unls], dim=0) - y = torch.cat([y_lbl, *(y_unl,) * len(x_unls)], dim=0) + y = torch.cat([y_lbl_ohe, *(y_unl,) * len(x_unls)], dim=0) x_mix, y_mix = self.mix_up(x, y, self.mix_beta_alpha) # This had interleaving, but it was removed as it's not @@ -177,7 +185,21 @@ def training_step(self, batch, batch_idx): y_mix_unl = y_mix[batch_size:] loss_lbl = self.loss_lbl(y_mix_lbl_pred, y_mix_lbl) + self.lbl_logger( + self.logger.experiment, + "Labelled Y Pred", + torch.argmax(y_mix_lbl_pred, dim=1), + flush_every=10, + num_bins=self.n_classes, + ) loss_unl = self.loss_unl(y_mix_unl_pred, y_mix_unl) + self.lbl_logger( + self.logger.experiment, + "Unlabelled Y Pred", + torch.argmax(y_mix_unl_pred, dim=1), + flush_every=10, + num_bins=self.n_classes, + ) loss_unl_scale = self.loss_unl_scaler(progress=self.progress) loss = loss_lbl + loss_unl * loss_unl_scale @@ -188,7 +210,7 @@ def training_step(self, batch, batch_idx): else: # This route implies that we are just using supervised learning y_pred = self(x_lbl) - loss = self.loss_lbl(y_pred, y_lbl.float()) + loss = self.loss_lbl(y_pred, y_lbl_ohe.float()) self.log("train_loss", loss) return loss @@ -201,7 +223,21 @@ def on_after_backward(self) -> None: def validation_step(self, batch, batch_idx): x, y = batch + self.lbl_logger( + self.logger.experiment, + "Val Input Y Label", + y, + flush_every=1, + num_bins=self.n_classes, + ) y_pred = self.ema_model(x) + self.lbl_logger( + self.logger.experiment, + "Val Pred Y Label", + torch.argmax(y_pred, dim=1), + flush_every=1, + num_bins=self.n_classes, + ) loss = F.cross_entropy(y_pred, y.long()) acc = accuracy( @@ -241,72 +277,98 @@ def on_before_batch_transfer(self, batch: Any, dataloader_idx: int) -> Any: We leverage this to do some preprocessing on the data. Namely, we use the StandardScaler and OrdinalEncoder to transform the data. - """ - # TODO: ngl, this is pretty chunky. - # It works, but it's not very pretty. - if self.training: - (x_lab, y), x_unl = batch - xs = [x_lab, *x_unl] + Notes: + PyTorch Lightning may complain about this being on the Module + instead of the DataModule. However, this is intentional as we + want to export the model alongside the transformations. + """ - b, c, h, w = x_lab.shape + def x_trans_fn(x): + # Standard Scaler only accepts (n_samples, n_features), + # so we need to do some fancy reshaping. + # Note that moving dimensions then reshaping is different from just + # reshaping! # Move Channel to the last dimension then transform - xs_ss: list[np.ndarray] = [ - self.x_scaler.transform(x.permute(0, 2, 3, 1).reshape(-1, c)) - for x in xs - ] + # B x C x H x W -> B x H x W x C + b, c, h, w = x.shape + x_ss = self.x_scaler.transform( + x.permute(0, 2, 3, 1).reshape(-1, c) + ) # Move Channel back to the second dimension - xs_: list[torch.Tensor] = [ + # B x H x W x C -> B x C x H x W + return ( torch.from_numpy(x_ss.reshape(b, h, w, c)) .permute(0, 3, 1, 2) .float() - for x_ss in xs_ss - ] + ) - y: tuple[str] - y_: torch.Tensor = torch.from_numpy( + def y_trans_fn(y): + return torch.from_numpy( self.y_encoder.transform(np.array(y).reshape(-1, 1)).squeeze() ) - # Ordinal Encoders can return a np.nan if the value is not in the - # categories. We will remove that from the batch. - x_ = xs_[0][~torch.isnan(y_)] - y_ = y_[~torch.isnan(y_)] + # We need to handle the train and val dataloaders differently. 
+ # For training, the unlabelled data is returned while for validation, + # the unlabelled data is just omitted. + if self.training: + (x_lab, y), x_unl = batch + else: + x_lab, y = batch + x_unl = [] - return (x_, y_.long()), xs_[1:] + x_lab_trans = x_trans_fn(x_lab) + y_trans = y_trans_fn(y) + x_unl_trans = [x_trans_fn(x) for x in x_unl] - else: - x, y = batch + # Remove nan values from the batch + # Ordinal Encoders can return a np.nan if the value is not in the + # categories. We will remove that from the batch. + nan = ~torch.isnan(y_trans) + x_lab_trans = x_lab_trans[nan] + x_unl_trans = [x[nan] for x in x_unl_trans] + y_trans = y_trans[nan] - x: torch.Tensor - b, c, h, w = x.shape + if self.training: + return (x_lab_trans, y_trans.long()), x_unl_trans + else: + return x_lab_trans, y_trans.long() - # Standard Scaler only accepts (n_samples, n_features), - # so we need to do some fancy reshaping. - # Note that moving dimensions then reshaping is different from just - # reshaping! - # Move Channel to the last dimension then transform - x_ss: np.ndarray = self.x_scaler.transform( - x.permute(0, 2, 3, 1).reshape(-1, c) - ) - # Move Channel back to the second dimension - x_: torch.Tensor = ( - torch.from_numpy(x_ss.reshape(b, h, w, c)) - .permute(0, 3, 1, 2) - .float() - ) +class WandBLabelLogger(dict): + """Logger to log y labels to WandB""" - y: tuple[str] - y_: torch.Tensor = torch.from_numpy( - self.y_encoder.transform(np.array(y).reshape(-1, 1)).squeeze() - ) + def __call__( + self, + logger: wandb.sdk.wandb_run.Run, + key: str, + value: torch.Tensor, + num_bins: int, + flush_every: int = 10, + ): + """Log the labels to WandB - # Ordinal Encoders can return a np.nan if the value is not in the - # categories. We will remove that from the batch. - x_ = x_[~torch.isnan(y_)] - y_ = y_[~torch.isnan(y_)] + Args: + logger: The W&B logger. Accessible through `self.logger.experiment` + key: The key to log the labels under. + value: The labels to log. + num_bins: The number of bins for the logged histogram. + flush_every: How often to flush the labels to WandB. - return x_, y_.long() + """ + if key not in self.keys(): + self[key] = [value] + else: + self[key].append(value) + + if len(self[key]) % flush_every == 0: + logger.log( + { + key: wandb.Histogram( + # Log all labels buffered since the last + # flush, not just the latest batch. + torch.cat(self[key]).flatten().detach().cpu().tolist(), + num_bins=num_bins, + ) + } + ) + self[key] = [] diff --git a/src/frdc/train/stratified_sampling.py b/src/frdc/train/stratified_sampling.py new file mode 100644 index 00000000..dd17762c --- /dev/null +++ b/src/frdc/train/stratified_sampling.py @@ -0,0 +1,65 @@ +from __future__ import annotations + +from typing import Iterator, Any, Sequence + +import torch +from sklearn.preprocessing import LabelEncoder +from torch.utils.data import Sampler + + +class RandomStratifiedSampler(Sampler[int]): + def __init__( + self, + targets: Sequence[Any], + num_samples: int | None = None, + replacement: bool = True, + ) -> None: + """Stratified sampling from a dataset, such that each class is + sampled with equal probability. + + Examples: + Use this with DataLoader to sample from a dataset in a stratified + fashion. For example:: + + ds = TensorDataset(...) + dl = DataLoader( + ds, + batch_size=..., + sampler=RandomStratifiedSampler(targets), + ) + + This will use the targets' frequency as the inverse probability + for sampling. For example, if the targets are [0, 0, 1, 2], + then the per-sample probabilities are [1/6, 1/6, 1/3, 1/3], + giving each class an equal total probability of 1/3. + + Args: + targets: The targets to stratify by. These are label-encoded + internally, so they need not be integers. + num_samples: The number of samples to draw.
If None, the + number of samples is equal to the length of the dataset. + """ + super().__init__() + + # Given targets [0, 0, 1] + # bincount = [2, 1] + # 1 / bincount = [0.5, 1] + # 1 / bincount / len(bincount) = [0.25, 0.5] + # The indexing then just projects it to the original targets. + targets_lab = torch.tensor(LabelEncoder().fit_transform(targets)) + self.target_probs: torch.Tensor = ( + 1 / (bincount := torch.bincount(targets_lab)) / len(bincount) + )[targets_lab] + + self.num_samples = num_samples if num_samples else len(targets) + self.replacement = replacement + + def __len__(self) -> int: + return self.num_samples + + def __iter__(self) -> Iterator[int]: + """This should be a generator that yields indices from the dataset.""" + yield from torch.multinomial( + self.target_probs, + num_samples=self.num_samples, + replacement=self.replacement, + ) diff --git a/src/frdc/utils/training.py b/src/frdc/utils/training.py new file mode 100644 index 00000000..d8130b3a --- /dev/null +++ b/src/frdc/utils/training.py @@ -0,0 +1,67 @@ +from __future__ import annotations +from pathlib import Path + +import lightning as pl +import numpy as np +from matplotlib import pyplot as plt +from seaborn import heatmap +from sklearn.metrics import confusion_matrix +from torch.utils.data import DataLoader + +from frdc.load.dataset import FRDCDataset + + +def get_latest_ckpt_path(search_dir: Path, extension: str = "ckpt"): + # This fetches all possible checkpoints and gets the latest one + return sorted( + search_dir.glob(f"**/*.{extension}"), + key=lambda x: x.stat().st_mtime_ns, + )[-1] + + +def plot_confusion_matrix( + y_trues, y_preds, labels +) -> tuple[plt.Figure, plt.Axes]: + # Plot the confusion matrix + cm = confusion_matrix(y_trues, y_preds) + + fig, ax = plt.subplots(figsize=(10, 10)) + + heatmap( + cm, + annot=True, + xticklabels=labels, + yticklabels=labels, + cbar=False, + ax=ax, + ) + + fig.tight_layout(pad=3) + ax.set_xlabel("Predicted Label") + ax.set_ylabel("True Label") + + return fig, ax + + +def predict( + ds: FRDCDataset, + model_cls: type[pl.LightningModule], + ckpt_pth: Path | str | None = None, +) -> tuple[np.ndarray, np.ndarray]: + m = model_cls.load_from_checkpoint(ckpt_pth) + # Make predictions + trainer = pl.Trainer(logger=False) + pred = trainer.predict(m, dataloaders=DataLoader(ds, batch_size=32)) + + y_preds = [] + y_trues = [] + for y_true, y_pred in pred: + y_preds.append(y_pred) + y_trues.append(y_true) + y_trues = np.concatenate(y_trues) + y_preds = np.concatenate(y_preds) + return y_trues, y_preds + + +def accuracy(y_trues, y_preds) -> float: + return (y_trues == y_preds).mean() diff --git a/src/label-studio/docker-compose.yml b/src/label-studio/docker-compose.yml index 4a6d909f..9340fb8b 100644 --- a/src/label-studio/docker-compose.yml +++ b/src/label-studio/docker-compose.yml @@ -67,6 +67,7 @@ services: - POSTGRES_HOST_AUTH_METHOD=trust volumes: - ${POSTGRES_DATA_DIR:-./postgres-data}:/var/lib/postgresql/data + - ${POSTGRES_BACKUP_DIR:-./postgres-backups}:/var/lib/postgresql/backups - ./deploy/pgsql/certs:/var/lib/postgresql/certs:ro networks: - label-studio diff --git a/src/label-studio/dump.sh b/src/label-studio/dump.sh new file mode 100644 index 00000000..d651f42e --- /dev/null +++ b/src/label-studio/dump.sh @@ -0,0 +1,16 @@ +echo "Creating backups directory..." +docker exec label-studio-db-1 sh -c "if [ ! -d \"/var/lib/postgresql/backups/\" ]; then mkdir -p \"/var/lib/postgresql/backups/\"; fi" + +echo "Checking if label-studio-db-1 is running..."
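+# NOTE: pg_isready exits non-zero when the server is not accepting connections;
+# the "$?" check below uses that exit code to abort before attempting a dump.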
+docker exec label-studio-db-1 sh -c "pg_isready -U postgres" + +if [ $? -ne 0 ]; then + echo "label-studio-db-1 is not running. Exiting..." + exit 1 +fi + +echo "Dumping database... to /var/lib/postgresql/backups/" +docker exec label-studio-db-1 sh -c "pg_dump -Fc -U postgres -d postgres -f \"/var/lib/postgresql/backups/$(date +'%d-%m-%Y_%HH%MM%SS').backup\"" + +echo "Dumping database in SQL format... to /var/lib/postgresql/backups/" +docker exec label-studio-db-1 sh -c "pg_dump -U postgres -d postgres -f \"/var/lib/postgresql/backups/$(date +'%d-%m-%Y_%HH%MM%SS').sql\"" diff --git a/tests/conftest.py b/tests/conftest.py index 1e9d84bd..b7bf6357 100644 --- a/tests/conftest.py +++ b/tests/conftest.py @@ -1,12 +1,13 @@ import numpy as np import pytest -from frdc.load import FRDCDataset +from frdc.load.dataset import FRDCDataset +from frdc.load.preset import FRDCDatasetPreset @pytest.fixture(scope="session") def ds() -> FRDCDataset: - return FRDCDataset._load_debug_dataset() + return FRDCDatasetPreset.DEBUG() @pytest.fixture(scope="session") diff --git a/tests/model_tests/chestnut_dec_may/train.py b/tests/model_tests/chestnut_dec_may/train.py index 9c2b3c96..8d4aad1c 100644 --- a/tests/model_tests/chestnut_dec_may/train.py +++ b/tests/model_tests/chestnut_dec_may/train.py @@ -3,8 +3,13 @@ This test is done by training a model on the 20201218 dataset, then testing on the 20210510 dataset. """ - import os + +# Uncomment this to run the W&B monitoring locally +# import os +# from frdc.utils.training import predict, plot_confusion_matrix +# os.environ["WANDB_MODE"] = "offline" + from pathlib import Path import lightning as pl @@ -18,15 +23,14 @@ from lightning.pytorch.loggers import WandbLogger from sklearn.preprocessing import StandardScaler, OrdinalEncoder -from frdc.load import FRDCDataset -from frdc.load.dataset import FRDCUnlabelledDataset +from frdc.load.preset import FRDCDatasetPreset as ds from frdc.models.inceptionv3 import InceptionV3MixMatchModule from frdc.train.frdc_datamodule import FRDCDataModule +from frdc.utils.training import predict, plot_confusion_matrix from model_tests.utils import ( train_preprocess, train_unl_preprocess, preprocess, - evaluate, FRDCDatasetFlipped, ) @@ -38,32 +42,12 @@ def main( val_iters=15, lr=1e-3, ): - run = wandb.init() - logger = WandbLogger(name="chestnut_dec_may", project="frdc") # Prepare the dataset - train_lab_ds = FRDCDataset( - "chestnut_nature_park", - "20201218", - None, - transform=train_preprocess, - ) - - # TODO: This is a hacky impl of the unlabelled dataset, see the docstring - # for future work. 
- train_unl_ds = FRDCUnlabelledDataset( - "chestnut_nature_park", - "20201218", - None, - transform=train_unl_preprocess(2), - ) - - # Subset(train_ds, np.argwhere(train_ds.targets == 0).reshape(-1)) - val_ds = FRDCDataset( - "chestnut_nature_park", - "20210510", - "90deg43m85pct255deg", - transform=preprocess, + train_lab_ds = ds.chestnut_20201218(transform=train_preprocess) + train_unl_ds = ds.chestnut_20201218.unlabelled( + transform=train_unl_preprocess(2) ) + val_ds = ds.chestnut_20210510_43m(transform=preprocess) oe = OrdinalEncoder( handle_unknown="use_encoded_value", @@ -78,12 +62,12 @@ def main( # Prepare the datamodule and trainer dm = FRDCDataModule( train_lab_ds=train_lab_ds, - # Pass in None to use the default supervised DM - train_unl_ds=train_unl_ds, + train_unl_ds=train_unl_ds, # None to use supervised DM val_ds=val_ds, batch_size=batch_size, train_iters=train_iters, val_iters=val_iters, + sampling_strategy="stratified", ) trainer = pl.Trainer( @@ -101,32 +85,41 @@ def main( monitor="val_loss", mode="min", save_top_k=1 ), ], - logger=logger, + logger=( + logger := WandbLogger(name="chestnut_dec_may", project="frdc") + ), ) + m = InceptionV3MixMatchModule( n_classes=n_classes, lr=lr, x_scaler=ss, y_encoder=oe, ) + logger.watch(m) trainer.fit(m, datamodule=dm) with open(Path(__file__).parent / "report.md", "w") as f: f.write( f"# Chestnut Nature Park (Dec 2020 vs May 2021)\n" - f"- Results: [WandB Report]({run.get_url()})" + f"- Results: [WandB Report]({wandb.run.get_url()})" ) - fig, acc = evaluate( + y_true, y_pred = predict( ds=FRDCDatasetFlipped( "chestnut_nature_park", "20210510", "90deg43m85pct255deg", transform=preprocess, ), + model_cls=InceptionV3MixMatchModule, ckpt_pth=Path(ckpt.best_model_path), ) + fig, ax = plot_confusion_matrix(y_true, y_pred, oe.categories_[0]) + acc = np.sum(y_true == y_pred) / len(y_true) + ax.set_title(f"Accuracy: {acc:.2%}") + wandb.log({"confusion_matrix": wandb.Image(fig)}) wandb.log({"eval_accuracy": acc}) @@ -140,8 +133,8 @@ def main( VAL_ITERS = 15 LR = 1e-3 - assert wandb.run is None - wandb.setup(wandb.Settings(program=__name__, program_relpath=__name__)) + wandb.login(key=os.environ["WANDB_API_KEY"]) + main( batch_size=BATCH_SIZE, epochs=EPOCHS, diff --git a/tests/model_tests/utils.py b/tests/model_tests/utils.py index 593bae11..bc820f53 100644 --- a/tests/model_tests/utils.py +++ b/tests/model_tests/utils.py @@ -1,12 +1,8 @@ +from __future__ import annotations + from pathlib import Path -import lightning as pl -import numpy as np import torch -from matplotlib import pyplot as plt -from seaborn import heatmap -from sklearn.metrics import confusion_matrix -from torch.utils.data import DataLoader from torchvision.transforms import RandomVerticalFlip from torchvision.transforms.v2 import ( Compose, @@ -18,7 +14,7 @@ ) from torchvision.transforms.v2 import RandomHorizontalFlip -from frdc.load import FRDCDataset +from frdc.load.dataset import FRDCDataset from frdc.models.inceptionv3 import InceptionV3MixMatchModule THIS_DIR = Path(__file__).parent @@ -49,48 +45,6 @@ def __getitem__(self, idx): return RandomHorizontalFlip(p=1)(RandomVerticalFlip(p=1)(x)), y -def evaluate( - ds: FRDCDataset, ckpt_pth: Path | str | None = None -) -> tuple[plt.Figure, float]: - if ckpt_pth is None: - # This fetches all possible checkpoints and gets the latest one - ckpt_pth = sorted( - THIS_DIR.glob("**/*.ckpt"), key=lambda x: x.stat().st_mtime_ns - )[-1] - - m = InceptionV3MixMatchModule.load_from_checkpoint(ckpt_pth) - # Make predictions - trainer = 
pl.Trainer(logger=False) - pred = trainer.predict(m, dataloaders=DataLoader(ds, batch_size=32)) - - y_trues = [] - y_preds = [] - for y_true, y_pred in pred: - y_trues.append(y_true) - y_preds.append(y_pred) - y_trues = np.concatenate(y_trues) - y_preds = np.concatenate(y_preds) - acc = (y_trues == y_preds).mean() - - # Plot the confusion matrix - cm = confusion_matrix(y_trues, y_preds) - - plt.figure(figsize=(10, 10)) - - heatmap( - cm, - annot=True, - xticklabels=m.y_encoder.categories_[0], - yticklabels=m.y_encoder.categories_[0], - cbar=False, - ) - plt.title(f"Accuracy: {acc:.2%}") - plt.tight_layout(pad=3) - plt.xlabel("Predicted Label") - plt.ylabel("True Label") - return plt.gcf(), acc - - def preprocess(x): return Compose( [ diff --git a/tests/unit_tests/load/test_frdc_dataset.py b/tests/unit_tests/load/test_frdc_dataset.py index c0e2c838..0a75425c 100644 --- a/tests/unit_tests/load/test_frdc_dataset.py +++ b/tests/unit_tests/load/test_frdc_dataset.py @@ -1,4 +1,5 @@ from frdc.conf import BAND_CONFIG +from frdc.load.dataset import FRDCConcatDataset from frdc.utils import Rect @@ -23,3 +24,14 @@ def test_get_bounds(ds): bounds, labels = ds.get_bounds_and_labels() assert all([isinstance(b, Rect) for b in bounds]) assert len(bounds) == len(labels) + + +def test_ds_add_ds_creates_concat_ds(ds): + assert isinstance(ds + ds, FRDCConcatDataset) + assert len(ds + ds) == len(ds) * 2 + + +def test_concat_ds_add_ds_creates_concat_ds(ds): + cds = ds + ds + assert isinstance(cds + ds, FRDCConcatDataset) + assert len(cds + ds) == len(ds) * 3 diff --git a/tests/unit_tests/train/__init__.py b/tests/unit_tests/train/__init__.py new file mode 100644 index 00000000..e69de29b diff --git a/tests/unit_tests/train/test_stratified_sampling.py b/tests/unit_tests/train/test_stratified_sampling.py new file mode 100644 index 00000000..e8019b64 --- /dev/null +++ b/tests/unit_tests/train/test_stratified_sampling.py @@ -0,0 +1,47 @@ +from __future__ import annotations + +import torch +from torch.utils.data import DataLoader, TensorDataset + +from frdc.train.stratified_sampling import RandomStratifiedSampler + + +def test_stratified_sampling_has_correct_probs(): + sampler = RandomStratifiedSampler(["A", "A", "B"]) + + assert torch.all(sampler.target_probs == torch.tensor([0.25, 0.25, 0.5])) + + +def test_stratified_sampling_fairly_samples(): + """This test checks that the stratified sampler works with a dataloader.""" + + # This is a simple example of a dataset with 2 classes. + # The first 2 samples are class "A", the third is class "B". + x = torch.tensor([0, 1, 2]) + y = ["A", "A", "B"] + + # To check that it's truly stratified, we'll sample 1000 times + # then assert that both classes are sampled roughly equally. + + # In this case, the first 2 x should be sampled roughly 250 times, + # and the third x should be sampled roughly 500 times. + + num_samples = 1000 + batch_size = 10 + dl = DataLoader( + TensorDataset(x), + batch_size=batch_size, + sampler=RandomStratifiedSampler(y, num_samples=num_samples), + ) + + # Note that when we sample from a TensorDataset, we get a tuple of tensors. + # So we need to unpack the tuple. + x_samples = torch.cat([x for (x,) in dl]) + + assert len(x_samples) == num_samples + assert torch.allclose( + torch.bincount(x_samples), + torch.tensor([250, 250, 500]), + # atol is the absolute tolerance, so the result can differ by 50 + atol=50, + )
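As a worked check of the sampler arithmetic these tests exercise, the following standalone sketch mirrors RandomStratifiedSampler's probability computation (the `targets` list here is illustrative):

    import torch
    from sklearn.preprocessing import LabelEncoder

    targets = ["A", "A", "B"]
    t = torch.tensor(LabelEncoder().fit_transform(targets))  # tensor([0, 0, 1])
    bincount = torch.bincount(t)                             # tensor([2, 1])
    probs = (1 / bincount / len(bincount))[t]                # tensor([0.2500, 0.2500, 0.5000])
    # Each class carries a total mass of 0.5, so over 1000 draws with
    # replacement we expect roughly [250, 250, 500] picks per index,
    # which is what the atol=50 assertion above tolerates.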