From c3043b512d5d4f2a0ad9d53bcd06a9b290e8db92 Mon Sep 17 00:00:00 2001 From: Tommy Date: Fri, 20 Jun 2025 15:38:28 -0700 Subject: [PATCH 1/8] data augmentations import --- learning/training/training.py | 9 +++++++++ 1 file changed, 9 insertions(+) diff --git a/learning/training/training.py b/learning/training/training.py index 5dd578c..35151db 100644 --- a/learning/training/training.py +++ b/learning/training/training.py @@ -33,6 +33,8 @@ from fastai.vision.utils import get_image_files from torch import nn +from data_augmentations import AlbumentationsTransform, get_train_aug, get_valid_aug + def parse_args() -> Namespace: arg_parser = ArgumentParser("Train command classification networks.") @@ -155,6 +157,10 @@ def get_dls(args: Namespace, data_paths: list): args, data_paths, image_filenames, label_func ) else: + albumentations_tfms = AlbumentationsTransform( + get_train_aug(), get_valid_aug() + ) # object to provide data augmentation logic + return ImageDataLoaders.from_name_func( data_paths[0], # TODO: find a better place to save models image_filenames, @@ -163,6 +169,9 @@ def get_dls(args: Namespace, data_paths: list): shuffle=True, bs=args.batch_size, item_tfms=Resize(args.image_resize), + batch_tfms=[ + albumentations_tfms + ], # apply data augmentations by batch after resizing ) From 28003f49037880410434f467c30956b41edde5a3 Mon Sep 17 00:00:00 2001 From: Tommy Date: Fri, 20 Jun 2025 15:41:04 -0700 Subject: [PATCH 2/8] data augmentations class --- learning/training/data_augmentations.py | 89 +++++++++++++++++++++++++ 1 file changed, 89 insertions(+) create mode 100644 learning/training/data_augmentations.py diff --git a/learning/training/data_augmentations.py b/learning/training/data_augmentations.py new file mode 100644 index 0000000..0ceada9 --- /dev/null +++ b/learning/training/data_augmentations.py @@ -0,0 +1,89 @@ +import albumentations as A +import numpy as np +from fastai.vision.core import PILImage +from fastai.vision.augment import RandTransform + + 
+class AlbumentationsTransform(RandTransform): + """Class that handles albumentations transformations during training.""" + + def __init__(self, train_aug, valid_aug=None, split_idx=None): + """Constructor for AlbumentationsTransform.""" + super().__init__() # calls base class (RandTransform) constructor + self.train_aug = train_aug + self.valid_aug = ( + valid_aug or train_aug + ) # defaults to training augmentations if no validation augmentations are provided + self.split_idx = split_idx # indicates whether the transform is applied to training or validation data + self.order = 2 # apply after resizing + + def before_call(self, b, split_idx): + """Called before the transform is applied to set the split index so we know if it's training or validation.""" + self.idx = split_idx + + def encodes(self, img: PILImage): + """Apply the Albumentations transformations to the input image.""" + aug = ( + self.train_aug if self.idx == 0 else self.valid_aug + ) # apply the appropriate augmentation + image = np.array(img) # albumentations works with numpy arrays + image = aug(image=image)[ + "image" + ] # extract the image from the augmentation result + return PILImage.create(image) # convert back to PILImage for compatibility + + +def get_train_aug(): + """Data augmentations applied to training data.""" + return A.Compose( + [ + A.Affine( + scale=(0.9, 1.1), # scale by 90%-110% of original size + translate_percent=0.1, # shift horizontally or vertically by up to 10% of its width/height + rotate=(-10, 10), # rotate between -10 and 10 degrees + p=0.5, # 50% chance to apply affine transformations + ), + A.RandomBrightnessContrast( + p=0.2 # 20% chance to adjust brightness and contrast + ), + # possible augmentations to add: + # A.Perspective( + # scale=(0.05, 0.1), # apply perspective transformation with a scale factor between 5% and 10% + # p=0.5 # 50% chance to apply perspective transformation + # ), + # A.HueSaturationValue( + # hue_shift_limit=20, # shift hue by up to 20 
degrees + # sat_shift_limit=20, # shift saturation by up to 20% + # val_shift_limit=20, # shift value by up to 20% + # p=0.5 # 50% chance to apply hue, saturation, and value adjustments + # ), + # A.RandomGamma( + # gamma_limit=(80, 120), # adjust gamma between 80% and 120% + # p=0.5 # 50% chance to apply gamma adjustment + # ), + # A.RGBShift( + # r_shift_limit=20, # shift red channel by up to 20 + # g_shift_limit=20, # shift green channel by up to 20 + # b_shift_limit=20, # shift blue channel by up to 20 + # p=0.5 # 50% chance to apply RGB shift + # ), + # A.MotionBlur( + # blur_limit=(3, 7), # apply motion blur with a kernel size between 3 and 7 + # p=0.5 # 50% chance to apply motion blur + # ), + # A.GaussianNoise( + # var_limit=(10, 50), # add Gaussian noise with a variance between 10 and 50 + # p=0.5 # 50% chance to apply Gaussian noise + # ), + # A.OpticalDistortion( + # distort_limit=0.05, # apply optical distortion with a limit of 5% + # shift_limit=0.05, # shift the image by up to 5% + # p=0.5 # 50% chance to apply optical distortion + # ), + ] + ) + + +def get_valid_aug(): + """Data augmentations applied to validation data (none).""" + return A.Compose([]) From 559d90dfd2f052938407793e2c48582d4c9e5ed0 Mon Sep 17 00:00:00 2001 From: Tommy Date: Fri, 20 Jun 2025 16:58:46 -0700 Subject: [PATCH 3/8] implemented program to download entire wandb projects --- download_wandb_project.py | 57 +++++++++++++++++++++++++++++++++++++++ 1 file changed, 57 insertions(+) create mode 100644 download_wandb_project.py diff --git a/download_wandb_project.py b/download_wandb_project.py new file mode 100644 index 0000000..a99d45f --- /dev/null +++ b/download_wandb_project.py @@ -0,0 +1,57 @@ +import wandb +import os +import argparse + +# example usage: +# python download_wandb_project.py Summer2024Official --output_dir Summer2024Official_downloads + + +def download_project_runs(project: str, output_dir: str): + """ + Download all runs and their artifacts from a specified WandB 
project. + + Args: + project (str): The name of the WandB project. + output_dir (str): The directory to save downloaded runs and artifacts. + """ + api = wandb.Api() # Initialize the WandB API + + runs = api.runs(f"arcslaboratory/{project}") # Get all runs for the project + print(f"Found {len(runs)} runs in project '{project}'") + + os.makedirs(output_dir, exist_ok=True) # Ensure output directory exists + + for run in runs: + run_dir = os.path.join(output_dir, run.id) # Directory for this run + os.makedirs(run_dir, exist_ok=True) # Create directory for the run + + print(f"\nDownloading run: {run.name} ({run.id})") + + # Download all files associated with the run + for file in run.files(): + print(f"File: {file.name}") + file.download(root=run_dir, replace=True) # Download file to run_dir + + # Download all logged artifacts for the run + for artifact in run.logged_artifacts(): + artifact_name = f"{artifact.name.replace('/', '_')}:{artifact.version}" # Format artifact name + print(f"Artifact: {artifact_name}") + artifact.download(root=run_dir) # Download artifact to run_dir + + +if __name__ == "__main__": + # Set up command-line argument parsing + parser = argparse.ArgumentParser( + description="Download all runs and artifacts from a WandB project." 
+ ) + parser.add_argument( + "project", help="WandB project name" + ) # Required project name argument + parser.add_argument( + "--output_dir", + default="wandb_downloads", + help="Directory to save the runs and artifacts", + ) + + args = parser.parse_args() # Parse command-line arguments + download_project_runs(args.project, args.output_dir) # Run the download function From 82caa439472416e23f153f94fdd4a506e555d1e5 Mon Sep 17 00:00:00 2001 From: Tommy Date: Mon, 7 Jul 2025 11:11:22 -0700 Subject: [PATCH 4/8] edited y_from_filename to handle the filename convention from the data collection notebook --- learning/training/training.py | 35 ++++++++++++++++++++++------------- 1 file changed, 22 insertions(+), 13 deletions(-) diff --git a/learning/training/training.py b/learning/training/training.py index 35151db..300d922 100644 --- a/learning/training/training.py +++ b/learning/training/training.py @@ -128,19 +128,28 @@ def get_angle_from_filename(filename: str) -> float: def y_from_filename(rotation_threshold: float, filename: str) -> str: - """Extracts the direction label from the filename of an image. 
- - Example: "path/to/file/001_000011_-1p50.png" --> "right" - """ - filename_stem = Path(filename).stem - angle = float(filename_stem.split("_")[2].replace("p", ".")) - - if angle > rotation_threshold: - return "left" - elif angle < -rotation_threshold: - return "right" - else: - return "forward" + path = Path(filename) + filename_stem = path.stem + parts = filename_stem.split("_") + direction_keywords = {"left", "right", "forward"} + + # Case 1: filename starts with a known direction keyword + if parts[0].lower() in direction_keywords: + return parts[0].lower() + + # Case 2: try to parse angle from filename + try: + angle_str = parts[2].replace("p", ".") + angle = float(angle_str) + if angle > rotation_threshold: + return "left" + elif angle < -rotation_threshold: + return "right" + else: + return "forward" + except (IndexError, ValueError): + # Fall back to folder name if all else fails + return path.parent.name.lower() def get_dls(args: Namespace, data_paths: list): From 4b8ec89503fe202ee3a4405c7a13625e2f81ee21 Mon Sep 17 00:00:00 2001 From: Tommy Date: Mon, 7 Jul 2025 11:11:48 -0700 Subject: [PATCH 5/8] ignore .jpg files --- .gitignore | 1 + 1 file changed, 1 insertion(+) diff --git a/.gitignore b/.gitignore index 631e10c..d474680 100644 --- a/.gitignore +++ b/.gitignore @@ -1,4 +1,5 @@ *.png +*.jpg *.mp4 *.gif *filelist.txt From de73477c409e90dc0e4943776e54f1cc226e5d2c Mon Sep 17 00:00:00 2001 From: Tommy Date: Mon, 7 Jul 2025 11:23:59 -0700 Subject: [PATCH 6/8] index error --- learning/training/training.py | 31 +++++++++++++++++-------------- 1 file changed, 17 insertions(+), 14 deletions(-) diff --git a/learning/training/training.py b/learning/training/training.py index 300d922..3315feb 100644 --- a/learning/training/training.py +++ b/learning/training/training.py @@ -133,23 +133,26 @@ def y_from_filename(rotation_threshold: float, filename: str) -> str: parts = filename_stem.split("_") direction_keywords = {"left", "right", "forward"} - # Case 1: filename 
starts with a known direction keyword + # Case 1: filename starts with a known direction if parts[0].lower() in direction_keywords: return parts[0].lower() - # Case 2: try to parse angle from filename - try: - angle_str = parts[2].replace("p", ".") - angle = float(angle_str) - if angle > rotation_threshold: - return "left" - elif angle < -rotation_threshold: - return "right" - else: - return "forward" - except (IndexError, ValueError): - # Fall back to folder name if all else fails - return path.parent.name.lower() + # Case 2: try to parse angle from third underscore-separated part + if len(parts) >= 3: + try: + angle_str = parts[2].replace("p", ".") + angle = float(angle_str) + if angle > rotation_threshold: + return "left" + elif angle < -rotation_threshold: + return "right" + else: + return "forward" + except ValueError: + pass # fall through to fallback + + # Fallback: get label from parent directory + return path.parent.name.lower() def get_dls(args: Namespace, data_paths: list): From a864c8a8195e803d1d4568a9bd01d669f282e1a8 Mon Sep 17 00:00:00 2001 From: Tommy Date: Mon, 7 Jul 2025 15:52:58 -0700 Subject: [PATCH 7/8] updated documentation to reflect data augmentation changes, added argument to enable/disable augmentations in training --- README.md | 3 ++- learning/{training => }/data_augmentations.py | 0 learning/{training => }/training.py | 15 +++++++++------ 3 files changed, 11 insertions(+), 7 deletions(-) rename learning/{training => }/data_augmentations.py (100%) rename learning/{training => }/training.py (96%) diff --git a/README.md b/README.md index 90e054e..e787a65 100644 --- a/README.md +++ b/README.md @@ -54,11 +54,12 @@ python upload_data.py DATA_NAME PROJECT_NAME "Sample description of uploading ru # This should be run on a system with a GPU (e.g., our server) # training.py, sbatch scripts, and datasets should be in the same directory on the server (could be learning) cd learning -python training.py MODEL_NAME PROJECT_NAME "Sample description of 
training run..." ARCHITECTURE_NAME DATA_NAME(S) --local_data +python training.py MODEL_NAME PROJECT_NAME "Sample description of training run..." ARCHITECTURE_NAME DATA_NAME(S) --local_data --use_augmentation # Performs inference # This will run on a system that can run Unreal Engine # Note: MODEL_NAME_FROM_WANDB can be found in arcslaboratory -> Projects -> PROJECT_NAME -> Artifacts +# data_augmentations.py must be in same directory as inference.py if performing inference on a model trained with data augmentation cd learning python inference.py INFERENCE_NAME PROJECT_NAME "Sample description of inference run..." MODEL_NAME_FROM_WANDB:VERSION IMAGE_SAVE_FOLDER_NAME ~~~ diff --git a/learning/training/data_augmentations.py b/learning/data_augmentations.py similarity index 100% rename from learning/training/data_augmentations.py rename to learning/data_augmentations.py diff --git a/learning/training/training.py b/learning/training.py similarity index 96% rename from learning/training/training.py rename to learning/training.py index 3315feb..0ff0e84 100644 --- a/learning/training/training.py +++ b/learning/training.py @@ -72,6 +72,11 @@ def parse_args() -> Namespace: ) # Training configuration + arg_parser.add_argument( + "--use_augmentation", + action="store_true", + help="Enable data augmentation if included (default is off).", + ) arg_parser.add_argument( "--num_epochs", type=int, default=10, help="Number of training epochs." 
) @@ -169,10 +174,6 @@ def get_dls(args: Namespace, data_paths: list): args, data_paths, image_filenames, label_func ) else: - albumentations_tfms = AlbumentationsTransform( - get_train_aug(), get_valid_aug() - ) # object to provide data augmentation logic - return ImageDataLoaders.from_name_func( data_paths[0], # TODO: find a better place to save models image_filenames, @@ -182,8 +183,10 @@ def get_dls(args: Namespace, data_paths: list): bs=args.batch_size, item_tfms=Resize(args.image_resize), batch_tfms=[ - albumentations_tfms - ], # apply data augmentations by batch after resizing + AlbumentationsTransform(get_train_aug(), get_valid_aug()) + ] # object to provide data augmentation logic + if args.use_augmentation # apply data augmentations by batch after resizing if indicated in args + else [], ) From 1a73076d89a8ee01d36ce79f99596f376307becd Mon Sep 17 00:00:00 2001 From: tonnyryam <74562524+tonnyryam@users.noreply.github.com> Date: Tue, 15 Jul 2025 10:29:39 -0700 Subject: [PATCH 8/8] now using fastai instead of albumentations for data augmentations --- learning/training.py | 28 ++++++++++++++++++++++------ 1 file changed, 22 insertions(+), 6 deletions(-) diff --git a/learning/training.py b/learning/training.py index 0ff0e84..d311fa8 100644 --- a/learning/training.py +++ b/learning/training.py @@ -33,8 +33,7 @@ from fastai.vision.utils import get_image_files from torch import nn -from data_augmentations import AlbumentationsTransform, get_train_aug, get_valid_aug - +from fastai.vision.all import aug_transforms, Normalize, imagenet_stats def parse_args() -> Namespace: arg_parser = ArgumentParser("Train command classification networks.") @@ -133,6 +132,10 @@ def get_angle_from_filename(filename: str) -> float: def y_from_filename(rotation_threshold: float, filename: str) -> str: + """Extracts the direction label from the filename of an image. 
+ + Example: "path/to/file/001_000011_-1p50.png" --> "right" + """ path = Path(filename) filename_stem = path.stem parts = filename_stem.split("_") @@ -183,10 +186,23 @@ def get_dls(args: Namespace, data_paths: list): bs=args.batch_size, item_tfms=Resize(args.image_resize), batch_tfms=[ - AlbumentationsTransform(get_train_aug(), get_valid_aug()) - ] # object to provide data augmentation logic - if args.use_augmentation # apply data augmentations by batch after resizing if indicated in args - else [], + *aug_transforms( # apply fastai's data augmentation transforms + size=args.image_resize, # scales images to be image_resize x image_resize + flip_vert=False, # vertical flip is not used + max_rotate=10.0, # rotate images by up to 10 degrees + min_zoom=0.9, # zoom images down to 90% of their original size + max_zoom=1.1, # zoom images up to 110% of their original size + max_lighting=0.2, # adjust lighting by up to 20% + max_warp=0.2, # warp images by up to 20% + p_affine=0.5, # probability of applying affine transformations (rotation, zoom, warp) + p_lighting=0.2, # probability of applying lighting adjustments + ), + Normalize.from_stats( + *imagenet_stats + ), # normalize images using ImageNet statistics + ] + if args.use_augmentation + else None, )