OSU-NLP-Group
diff --git a/‎analysis.py
+1-1 b/‎analysis.py
+1-1
diff --git a/‎logbook.md
+16-3 b/‎logbook.md
+16-3
diff --git a/‎main.py
+1-1 b/‎main.py
+1-1
diff --git a/‎pyproject.toml
+2-2 b/‎pyproject.toml
+2-2
diff --git a/‎saev/__init__.py
+10-7 b/‎saev/__init__.py
+10-7
diff --git a/‎saev/activations_store.py
-126 b/‎saev/activations_store.py
-126
diff --git a/‎saev/config.py
+2-108 b/‎saev/config.py
+2-108
@@ -192,7 +192,7 @@ def main(
         n_images: number of images to use. Use a smaller number for debugging.
         k_top_images: the number of top images to store per neuron.
     """
-    _, sae, acts_store = saev.utils.Session.from_disk(ckpt_path)
+    _, sae, acts_store = saev.Session.from_disk(ckpt_path)
     get_feature_data(
         sae,
         acts_store,
 
@@ -89,12 +89,25 @@ With this in mind, there are several minor changes I want to make before I do so
 
 1. Removing `transformer-lens` [done, commit [18612b7](https://github.com/samuelstevens/saev/commit/18612b75988c32ae8ab3db6656b44a442f3f7641)]
 2. Removing HookedVisionTransformer [done, commit [c7ba7c7](https://github.com/samuelstevens/saev/commit/c7ba7c72c76472fd8cf2e7b2dc668d03a15b803d)]
-3. OpenCLIP instead of huggingface `transformers`
+3. OpenCLIP instead of huggingface `transformers` [done, testing]
 4. Pre-computing ViT activations
 
 I'm going to do each of these independently using a set of runs as references.
 
 # 10/22/2024
 
-* Removed HookedVisionTransformer (see above)
-* Checkpoint [v6jto37s](https://wandb.ai/samuelstevens/saev/runs/wwb20pa0) worked
+Removed HookedVisionTransformer (see above).
+Checkpoint [v6jto37s](https://wandb.ai/samuelstevens/saev/runs/wwb20pa0) worked for training, analysis, and app data.
+
+Testing an implementation using OpenCLIP instead of `transformers`.
+Assuming it works (which seems likely, given that the loss curve is identical), I will pre-compute the activations, save them to disk as a numpy array, and memmap them during training rather than computing them.
+I expect this to take a little while because I had issues with shuffling and such in the analysis step earlier.
+I think the best strategy is to work backwards.
+The `generate_app_data.py` script doesn't need an activation store at all.
+So I will start with the `analysis.py` script and add a new activations store class that exposes the same interface as the original (except possibly the constructor).
+Then I will verify that the analysis script works correctly.
+
+Only after that will I use the new class in training.
+Working with the analysis script is a shorter feedback loop.
+
+# 10/23/2024
@@ -18,4 +18,4 @@
         torch.backends.cudnn.benchmark = True
         torch.backends.cudnn.deterministic = False
 
-    saev.training.train(tyro.cli(saev.Config))
+    saev.train(tyro.cli(saev.Config))
@@ -1,7 +1,7 @@
 [project]
 name = "saev"
 version = "0.1.0"
-description = "Add your description here"
+description = "Sparse autoencoders for vision transformers in PyTorch"
 readme = "README.md"
 requires-python = ">=3.11"
 dependencies = [
@@ -10,10 +10,10 @@ dependencies = [
     "einops>=0.8.0",
     "jaxtyping>=0.2.34",
     "marimo>=0.9.10",
+    "open-clip-torch>=2.28.0",
     "pillow>=11.0.0",
     "torch>=2.5.0",
     "tqdm>=4.66.5",
-    "transformers>=4.45.2",
     "tyro>=0.8.12",
     "wandb>=0.18.5",
 ]
 
@@ -1,14 +1,17 @@
-from . import training, utils
-from .activations_store import ActivationsStore
-from .config import Config
-from .vits import RecordedVit
-from .sparse_autoencoder import SparseAutoencoder
+from .modeling import (
+    ActivationsStore,
+    Config,
+    RecordedVit,
+    Session,
+    SparseAutoencoder,
+)
+from .training import train
 
 __all__ = [
     "ActivationsStore",
     "Config",
     "RecordedVit",
     "SparseAutoencoder",
-    "training",
-    "utils",
+    "Session",
+    "train",
 ]
@@ -1,110 +1,4 @@
-from dataclasses import dataclass
-
-import beartype
-import torch
-
-import wandb
-
-
-@beartype.beartype
-@dataclass
-class Config:
-    """
-    Configuration for training a sparse autoencoder on a vision transformer.
-    """
-
-    # Data Generating Function (Model + Training Distibuion)
-    image_width: int = 224
-    image_height: int = 224
-    model_name: str = "openai/clip-vit-large-patch14"
-    module_name: str = "resid"
-    block_layer: int = -2
-    dataset_path: str = "ILSVRC/imagenet-1k"
-
-    # SAE Parameters
-    d_in: int = 1024
-
-    # Activation Store Parameters
-    total_training_tokens: int = 2_621_440
-    n_batches_in_store: int = 15
-    store_size: int | None = None
-    vit_batch_size: int = 1024
-
-    # SAE Parameters
-    expansion_factor: int = 64
-
-    # Training Parameters
-    l1_coefficient: float = 0.00008
-    lr: float = 0.0004
-    lr_warm_up_steps: int = 500
-    batch_size: int = 1024
-
-    # Resampling protocol args
-    use_ghost_grads: bool = True
-    feature_sampling_window: int = 64
-    resample_batches: int = 32
-    feature_reinit_scale: float = 0.2
-    dead_feature_window: int = 64
-    dead_feature_estimation_method: str = "no_fire"
-    dead_feature_threshold: float = 1e-6
-
-    # WANDB
-    log_to_wandb: bool = True
-    wandb_project: str = "saev"
-    wandb_log_freq: int = 10
-
-    # Misc
-    device: str = "cuda"
-    seed: int = 42
-    dtype: torch.dtype = torch.float32
-    checkpoint_path: str = "checkpoints"
-
-    def __post_init__(self):
-        self.store_size = self.n_batches_in_store * self.batch_size
-
-        self.d_sae = self.d_in * self.expansion_factor
-
-        self.run_name = f"{self.d_sae}-L1-{self.l1_coefficient}-LR-{self.lr}-Tokens-{self.total_training_tokens:3.3e}"
-
-        self.device = torch.device(self.device)
-
-        unique_id = wandb.util.generate_id()
-        self.checkpoint_path = f"{self.checkpoint_path}/{unique_id}"
-
-        print(
-            f"Run name: {self.d_sae}-L1-{self.l1_coefficient}-LR-{self.lr}-Tokens-{self.total_training_tokens:3.3e}"
-        )
-        # Print out some useful info:
-
-        total_training_steps = self.total_training_tokens // self.batch_size
-        print(f"Total training steps: {total_training_steps}")
-
-        total_wandb_updates = total_training_steps // self.wandb_log_freq
-        print(f"Total wandb updates: {total_wandb_updates}")
-
-        # how many times will we sample dead neurons?
-        # assert self.dead_feature_window <= self.feature_sampling_window, "dead_feature_window must be smaller than feature_sampling_window"
-        n_feature_window_samples = total_training_steps // self.feature_sampling_window
-        print(
-            f"n_tokens_per_feature_sampling_window (millions): {(self.feature_sampling_window * self.batch_size) / 10** 6}"
-        )
-        print(
-            f"n_tokens_per_dead_feature_window (millions): {(self.dead_feature_window * self.batch_size) / 10** 6}"
-        )
-
-        if self.use_ghost_grads:
-            print("Using Ghost Grads.")
-
-        print(
-            f"We will reset the sparsity calculation {n_feature_window_samples} times."
-        )
-        print(
-            f"Number of tokens when resampling: {self.resample_batches * self.batch_size}"
-        )
-        print(
-            f"Number tokens in sparsity calculation window: {self.feature_sampling_window * self.batch_size:.2e}"
-        )
-
+from . import modeling
 
 #################
 # COMPATIBILITY #
@@ -115,4 +9,4 @@ def __post_init__(self):
 # The classes are the same, just named differently.
 
 
-ViTSAERunnerConfig = Config
+ViTSAERunnerConfig = modeling.Config