|
| 1 | +from typing import Union, cast |
| 2 | + |
| 3 | +import torch |
| 4 | +import torch.nn as nn |
| 5 | +from hyrax.models.model_registry import hyrax_model |
| 6 | + |
# VGG layer configurations keyed by variant letter (torchvision convention):
# each integer is the output-channel count of a 3x3 convolution, and "M"
# marks a 2x2 max-pooling layer. Only the "A" (VGG11) layout is defined here.
cfgs = {
    "A": [64, "M", 128, "M", 256, 256, "M", 512, 512, "M", 512, 512, "M"],
}
| 10 | + |
| 11 | + |
@hyrax_model
class VGG11(nn.Module):
    """Copy of the PyTorch VGG11 model for testing and demonstration
    purposes.
    https://docs.pytorch.org/vision/main/models/generated/torchvision.models.vgg11.html#torchvision.models.vgg11

    Hyperparameters are read from ``config["external_hyrax_example"]["VGG11"]``:
    ``dropout``, ``num_classes`` and ``batch_norm``.

    NOTE(review): ``self.optimizer`` and ``self.criterion`` are used by the
    train/validate/test loops but are never assigned in this class —
    presumably the ``hyrax_model`` registry attaches them; verify there.
    """

    def __init__(self, config, data_sample=None):
        """Basic initialization with architecture definition.

        Parameters
        ----------
        config : Mapping
            Hyrax configuration; must contain the
            ``external_hyrax_example.VGG11`` section described on the class.
        data_sample : tuple, optional
            A sample as produced by ``prepare_data`` (image first), used to
            infer the number of input channels. Required despite the default.

        Raises
        ------
        ValueError
            If ``data_sample`` is None.
        """
        super().__init__()
        if data_sample is None:
            raise ValueError(
                "VGG11 expected 'data_sample' to be provided at construction time "
                "so that input channel dimensions can be inferred, but received None."
            )
        image_sample = data_sample[0]
        # Only the channel count matters; spatial size is absorbed by the
        # adaptive pooling below. Assumes a (C, H, W) sample — TODO confirm.
        self.in_channels = image_sample.shape[0]
        self.config = config

        # Index the nested config section once instead of three times.
        model_cfg = self.config["external_hyrax_example"]["VGG11"]
        dropout = model_cfg["dropout"]
        num_classes = model_cfg["num_classes"]
        batch_norm = model_cfg["batch_norm"]

        self.features = self._make_layers(cfgs["A"], batch_norm=batch_norm)
        # Adaptive pooling fixes the classifier input size regardless of the
        # spatial dimensions of the incoming images.
        self.avgpool = nn.AdaptiveAvgPool2d((7, 7))
        self.classifier = nn.Sequential(
            nn.Linear(512 * 7 * 7, 4096),
            nn.ReLU(True),
            nn.Dropout(p=dropout),
            nn.Linear(4096, 4096),
            nn.ReLU(True),
            nn.Dropout(p=dropout),
            nn.Linear(4096, num_classes),
        )

    def _make_layers(self, cfg: list[Union[str, int]], batch_norm: bool = False) -> nn.Sequential:
        """Helper function to create the convolutional layers of the VGG11 architecture.

        ``cfg`` entries are output-channel counts for 3x3 convolutions, with
        the sentinel string "M" inserting a 2x2 max-pool. When ``batch_norm``
        is True a BatchNorm2d layer follows each convolution.
        """
        layers: list[nn.Module] = []
        in_channels = self.in_channels
        for v in cfg:
            if v == "M":
                layers += [nn.MaxPool2d(kernel_size=2, stride=2)]
            else:
                v = cast(int, v)
                conv2d = nn.Conv2d(in_channels, v, kernel_size=3, padding=1)
                if batch_norm:
                    layers += [conv2d, nn.BatchNorm2d(v), nn.ReLU(inplace=True)]
                else:
                    layers += [conv2d, nn.ReLU(inplace=True)]
                in_channels = v
        return nn.Sequential(*layers)

    def forward(self, batch: tuple) -> torch.Tensor:
        """The innermost logic in the forward pass.

        ``batch`` is an ``(image, label)`` pair as produced by
        ``prepare_data``; only the image tensor is consumed here.
        """
        x, _ = batch
        x = self.features(x)
        x = self.avgpool(x)
        x = torch.flatten(x, 1)
        x = self.classifier(x)
        return x

    def infer_batch(self, batch):
        """The innermost logic in the inference loop"""
        return self(batch)

    def train_batch(self, batch):
        """The innermost logic in the training loop.

        Performs one optimizer step and returns the scalar loss.
        """
        _, labels = batch
        self.optimizer.zero_grad()
        outputs = self(batch)
        loss = self.criterion(outputs, labels)
        loss.backward()
        self.optimizer.step()
        return {"loss": loss.item()}

    def _evaluate_loss(self, batch):
        """Shared forward + loss computation for validation and testing.

        Runs under ``torch.no_grad()`` — the loss is only reported as a
        Python float, so building an autograd graph would waste memory
        without changing the returned value.
        """
        _, labels = batch
        with torch.no_grad():
            outputs = self(batch)
            loss = self.criterion(outputs, labels)
        return {"loss": loss.item()}

    def validate_batch(self, batch):
        """The innermost logic in the validation loop"""
        return self._evaluate_loss(batch)

    def test_batch(self, batch):
        """The innermost logic in the testing loop"""
        return self._evaluate_loss(batch)

    @staticmethod
    def prepare_data(data_dict):
        """Method that converts the data in dictionary into the form the model expects.

        Returns an ``(image, label)`` tuple; ``label`` is None when the
        dataset carries no labels (e.g. pure inference).
        """
        image = data_dict["data"]["image"]
        # dict.get avoids the membership-test-then-index double lookup.
        label = data_dict["data"].get("label")
        return (image, label)
0 commit comments