re-add notebooks as tests

mivanit · mivanit · commit 7e833331e3e2 · 2025-09-30T12:03:55.000+01:00
diff --git a/tests/clustering/scripts/cluster_resid_mlp.py b/tests/clustering/scripts/cluster_resid_mlp.py
@@ -0,0 +1,198 @@
+# %%
+from typing import Any
+
+import matplotlib.pyplot as plt
+import torch
+from muutils.dbg import dbg_auto
+from torch import Tensor
+
+from spd.clustering.activations import (
+    ProcessedActivations,
+    component_activations,
+    process_activations,
+)
+from spd.clustering.merge import merge_iteration, merge_iteration_ensemble
+from spd.clustering.merge_config import MergeConfig
+from spd.clustering.merge_history import MergeHistory, MergeHistoryEnsemble
+from spd.clustering.merge_sweep import sweep_multiple_parameters
+from spd.clustering.plotting.activations import plot_activations
+from spd.clustering.plotting.merge import (
+    plot_dists_distribution,
+    plot_merge_iteration,
+)
+from spd.configs import Config
+from spd.experiments.resid_mlp.resid_mlp_dataset import ResidMLPDataset
+from spd.models.component_model import ComponentModel, SPDRunInfo
+from spd.registry import EXPERIMENT_REGISTRY
+from spd.utils.data_utils import DatasetGeneratedDataLoader
+
+# Use the GPU when torch reports one is available, otherwise the CPU.
+DEVICE: str = "cuda" if torch.cuda.is_available() else "cpu"
+
+# IPython autoreload magics, left commented out (they are not valid Python outside IPython)
+# %load_ext autoreload
+# %autoreload 2
+
+# %%
+# Load model
+# ============================================================
+# Take the canonical run registered for the "resid_mlp2" experiment. The assert stops
+# the script with a clear message when the registry entry has no canonical run.
+_CANONICAL_RUN: str | None = EXPERIMENT_REGISTRY["resid_mlp2"].canonical_run
+assert _CANONICAL_RUN is not None, "No canonical run found for resid_mlp2 experiment"
+SPD_RUN: SPDRunInfo = SPDRunInfo.from_path(_CANONICAL_RUN)
+MODEL: ComponentModel = ComponentModel.from_pretrained(SPD_RUN.checkpoint_path)
+MODEL.to(DEVICE)
+# Config stored with the run; the dataset cell below reads `task_config` from it.
+SPD_CONFIG: Config = SPD_RUN.config
+
+# %%
+# Setup dataset and dataloader
+# ============================================================
+# Used as the dataloader batch size at the end of this cell.
+N_SAMPLES: int = 128
+
+# The feature count comes from the loaded target model's config; feature probability
+# and data generation type come from the run's task config. Label computation is
+# switched off (`calc_labels=False`) and every label-related option is passed as None.
+DATASET: ResidMLPDataset = ResidMLPDataset(
+    n_features=MODEL.target_model.config.n_features,  # pyright: ignore[reportAttributeAccessIssue, reportArgumentType],
+    feature_probability=SPD_CONFIG.task_config.feature_probability,  # pyright: ignore[reportAttributeAccessIssue]
+    device=DEVICE,
+    calc_labels=False,
+    label_type=None,
+    act_fn_name=None,
+    label_fn_seed=None,
+    label_coeffs=None,
+    data_generation_type=SPD_CONFIG.task_config.data_generation_type,  # pyright: ignore[reportAttributeAccessIssue]
+)
+
+# Debug-dump the settings the dataset object actually ended up with.
+dbg_auto(
+    dict(
+        n_features=DATASET.n_features,
+        feature_probability=DATASET.feature_probability,
+        data_generation_type=DATASET.data_generation_type,
+    )
+)
+# One batch holds N_SAMPLES samples; shuffling is disabled.
+DATALOADER = DatasetGeneratedDataLoader(DATASET, batch_size=N_SAMPLES, shuffle=False)
+
+# %%
+# Get component activations
+# ============================================================
+# Result is a dict of tensors keyed by string
+# (presumably one entry per model module — TODO confirm against `component_activations`).
+COMPONENT_ACTS: dict[str, Tensor] = component_activations(
+    model=MODEL,
+    device=DEVICE,
+    dataloader=DATALOADER,
+    sigmoid_type="hard",
+)
+
+# Debug-dump the activations dict for inspection.
+dbg_auto(COMPONENT_ACTS)
+
+# %%
+
+# Shared by `process_activations` in this cell and by `MergeConfig` further down.
+FILTER_DEAD_THRESHOLD: float = 0.1
+
+# Process activations
+# ============================================================
+PROCESSED_ACTIVATIONS: ProcessedActivations = process_activations(
+    COMPONENT_ACTS,
+    filter_dead_threshold=FILTER_DEAD_THRESHOLD,
+    # NOTE(review): this line used to be annotated "Test the new sorting functionality",
+    # but the flag is False, i.e. sorting is NOT requested here — confirm which is intended.
+    sort_components=False,
+)
+
+
+# Plot the processed activations; `save_pdf=False` is passed, so no PDF is requested.
+plot_activations(
+    processed_activations=PROCESSED_ACTIVATIONS,
+    save_pdf=False,
+)
+
+# %%
+# run the merge iteration
+# ============================================================
+
+# `iters` is 90% of the alive-component count, truncated by `int()`. The dead-component
+# threshold is the same constant that was passed to `process_activations` above.
+MERGE_CFG: MergeConfig = MergeConfig(
+    activation_threshold=0.1,
+    alpha=1,
+    iters=int(PROCESSED_ACTIVATIONS.n_components_alive * 0.9),
+    merge_pair_sampling_method="range",
+    merge_pair_sampling_kwargs={"threshold": 0.0},
+    pop_component_prob=0,
+    filter_dead_threshold=FILTER_DEAD_THRESHOLD,
+)
+
+
+def _plot_func(
+    costs: torch.Tensor,
+    # merge_history: MergeHistory,
+    current_merge: Any,
+    current_coact: torch.Tensor,
+    # current_act_mask: torch.Tensor,
+    i: int,
+    # k_groups: int,
+    # activation_mask_orig: torch.Tensor,
+    component_labels: list[str],
+    # sweep_params: dict[str, Any],
+    **kwargs: Any,
+) -> None:
+    """Plot callback handed to `merge_iteration`; plots only on selected iterations.
+
+    A plot is drawn when `i` is 1 or a positive multiple of 50; every other call
+    returns without plotting.
+
+    Args:
+        costs: Forwarded to `plot_merge_iteration` as `costs`.
+        current_merge: Forwarded as `current_merge`.
+        current_coact: Forwarded as `current_coact`.
+        i: Iteration index; decides whether to plot and is forwarded as `iteration`.
+        component_labels: Forwarded as `component_labels`.
+        **kwargs: Any further keyword arguments from the caller; accepted and ignored.
+            The commented-out parameters in the signature are presumably the ones
+            available here (TODO confirm against `merge_iteration`).
+    """
+    # The extras are intentionally unused. `del` records that without raising when
+    # none are supplied; the earlier `assert kwargs` failed on an empty dict and is
+    # a no-op under `python -O`.
+    del kwargs
+
+    should_plot: bool = i == 1 or (i > 0 and i % 50 == 0)
+    if not should_plot:
+        return
+
+    plot_merge_iteration(
+        current_merge=current_merge,
+        current_coact=current_coact,
+        costs=costs,
+        iteration=i,
+        component_labels=component_labels,
+        show=True,  # Show the plot interactively
+    )
+
+
+# Run the merge on the processed activations, with `_plot_func` as the plot callback.
+MERGE_HIST: MergeHistory = merge_iteration(
+    activations=PROCESSED_ACTIVATIONS.activations,
+    merge_config=MERGE_CFG,
+    component_labels=PROCESSED_ACTIVATIONS.labels,
+    plot_callback=_plot_func,
+)
+
+# %%
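+# Plot merge history (disabled: the snippet below is commented out and refers to `mh` and `np`, which this script never defines or imports)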
+# ============================================================
+
+# plt.hist(mh[270]["merges"].components_per_group, bins=np.linspace(0, 56, 57))
+# plt.yscale("log")
+# plt.xscale("log")
+
+
+# %%
+# compute and plot distances in an ensemble
+# ============================================================
+
+# Same activations, labels and config as the single run above, with an ensemble size of 4.
+ENSEMBLE: MergeHistoryEnsemble = merge_iteration_ensemble(
+    activations=PROCESSED_ACTIVATIONS.activations,
+    component_labels=PROCESSED_ACTIVATIONS.labels,
+    merge_config=MERGE_CFG,
+    ensemble_size=4,
+)
+
+# Distances computed with the "perm_invariant_hamming" method
+# (presumably between ensemble members — TODO confirm against `get_distances`).
+DISTANCES = ENSEMBLE.get_distances(method="perm_invariant_hamming")
+
+plot_dists_distribution(
+    distances=DISTANCES,
+    mode="points",
+    # label="v1"
+)
+# NOTE(review): no `label` is passed above (it is commented out); unless
+# `plot_dists_distribution` labels its artists itself, this legend has nothing to show — confirm.
+plt.legend()
+
+
+# %%
+# do sweeps
+# ============================================================
+
+# Only `alpha` is swept (values 1 and 5); the other candidate sweeps are commented out.
+# The base config is MERGE_CFG dumped with `model_dump(mode="json")`.
+SWEEP_RESULTS: dict[str, Any] = sweep_multiple_parameters(
+    activations=PROCESSED_ACTIVATIONS.activations,
+    parameter_sweeps={
+        "alpha": [1, 5],
+        # "check_threshold": [0.0001, 0.001, 0.01, 0.1, 0.5],
+        # "pop_component_prob": [0.0001, 0.01, 0.5],
+    },
+    base_config=MERGE_CFG.model_dump(mode="json"),  # pyright: ignore[reportArgumentType],
+    component_labels=PROCESSED_ACTIVATIONS.labels,
+    ensemble_size=4,
+)
+
+# Show all plots
+# Each value unpacks as (ensembles, fig, ax), but none of the loop variables are used
+# (hence the B007 noqa); the loop simply calls `plt.show()` once per result entry.
+for param_name, (ensembles, fig, ax) in SWEEP_RESULTS.items():  # noqa: B007
+    plt.show()
diff --git a/tests/clustering/scripts/cluster_ss.py b/tests/clustering/scripts/cluster_ss.py
@@ -0,0 +1,112 @@
+# %%
+
+import matplotlib.pyplot as plt
+import numpy as np
+import torch
+from jaxtyping import Int
+from muutils.dbg import dbg_auto
+from torch import Tensor
+
+from spd.clustering.activations import (
+    ProcessedActivations,
+    component_activations,
+    process_activations,
+)
+from spd.clustering.merge import merge_iteration_ensemble
+from spd.clustering.merge_config import MergeConfig
+from spd.clustering.merge_history import MergeHistoryEnsemble
+from spd.clustering.plotting.activations import plot_activations
+from spd.clustering.plotting.merge import plot_dists_distribution
+from spd.clustering.scripts.s1_split_dataset import split_dataset_lm
+from spd.models.component_model import ComponentModel, SPDRunInfo
+
+# Use the GPU when torch reports one is available, otherwise the CPU.
+DEVICE: str = "cuda" if torch.cuda.is_available() else "cpu"
+
+# IPython autoreload magics, left commented out (they are not valid Python outside IPython)
+# %load_ext autoreload
+# %autoreload 2
+
+# %%
+# Load model and dataset
+# ============================================================
+# NOTE(review): the "wandb:" prefix presumably means the run is fetched from
+# Weights & Biases, which would need network access — confirm.
+MODEL_PATH: str = "wandb:goodfire/spd/runs/ioprgffh"
+
+# Ask for a single batch of 2 samples; the first element of the returned pair is discarded.
+_, DATA_CFG = split_dataset_lm(
+    model_path=MODEL_PATH,
+    n_batches=1,
+    batch_size=2,
+)
+# Only the first output file is used by the rest of the script.
+DATASET_PATH: str = DATA_CFG["output_files"][0]
+
+SPD_RUN: SPDRunInfo = SPDRunInfo.from_path(MODEL_PATH)
+MODEL: ComponentModel = ComponentModel.from_pretrained(SPD_RUN.checkpoint_path)
+MODEL.to(DEVICE)
+# Not referenced again in this script; kept available for interactive use.
+SPD_CONFIG = SPD_RUN.config
+
+
+# %%
+# Load data batch
+# ============================================================
+# Read the "input_ids" array from the file written by `split_dataset_lm` and wrap it in a tensor.
+DATA_BATCH: Int[Tensor, "batch_size n_ctx"] = torch.tensor(np.load(DATASET_PATH)["input_ids"])
+
+# %%
+# Get component activations
+# ============================================================
+# Here a single in-memory batch is passed via `batch=` (no dataloader).
+COMPONENT_ACTS: dict[str, Tensor] = component_activations(
+    model=MODEL,
+    batch=DATA_BATCH,
+    device=DEVICE,
+    sigmoid_type="hard",
+)
+
+# Debug-dump the activations; the return value is bound to `_`
+# (presumably so a notebook cell does not echo it — TODO confirm).
+_ = dbg_auto(COMPONENT_ACTS)
+# %%
+# Process activations
+# ============================================================
+# Both constants are reused by `MergeConfig` in the next cell.
+FILTER_DEAD_THRESHOLD: float = 0.001
+# Module-name prefix; the `filter_modules` predicate below is true for names starting with it.
+FILTER_MODULES: str = "model.layers.0"
+
+PROCESSED_ACTIVATIONS: ProcessedActivations = process_activations(
+    activations=COMPONENT_ACTS,
+    filter_dead_threshold=FILTER_DEAD_THRESHOLD,
+    filter_modules=lambda x: x.startswith(FILTER_MODULES),
+    seq_mode="concat",
+)
+
+# Plot the processed activations; `save_pdf=False` is passed, so no PDF is requested.
+plot_activations(
+    processed_activations=PROCESSED_ACTIVATIONS,
+    save_pdf=False,
+)
+
+# %%
+# Compute ensemble merge iterations
+# ============================================================
+# Deliberately small settings: 2 merge iterations here and an ensemble of 2 below.
+# The module filter and dead threshold repeat the values used for `process_activations`.
+MERGE_CFG: MergeConfig = MergeConfig(
+    activation_threshold=0.01,
+    alpha=0.01,
+    iters=2,
+    merge_pair_sampling_method="range",
+    merge_pair_sampling_kwargs={"threshold": 0.1},
+    pop_component_prob=0,
+    module_name_filter=FILTER_MODULES,
+    filter_dead_threshold=FILTER_DEAD_THRESHOLD,
+)
+
+ENSEMBLE: MergeHistoryEnsemble = merge_iteration_ensemble(
+    activations=PROCESSED_ACTIVATIONS.activations,
+    component_labels=PROCESSED_ACTIVATIONS.labels,
+    merge_config=MERGE_CFG,
+    ensemble_size=2,
+)
+
+
+# %%
+# Compute and plot distances
+# ============================================================
+# `get_distances()` is called with its default arguments here (no explicit `method`).
+DISTANCES = ENSEMBLE.get_distances()
+
+plot_dists_distribution(
+    distances=DISTANCES,
+    mode="points",
+)
+# NOTE(review): no label is passed above; unless `plot_dists_distribution` labels its
+# artists itself, this legend has nothing to show — confirm.
+plt.legend()
diff --git a/tests/clustering/test_clustering_experiments.py b/tests/clustering/test_clustering_experiments.py
@@ -6,11 +6,15 @@
 
 import pytest
 
+# Test resource directories.
+# NOTE: both paths are relative, so they resolve against the current working directory;
+# the `exists()` assertions in the tests below only hold when pytest is started from
+# the repository root.
+NOTEBOOK_DIR: Path = Path("tests/clustering/scripts")
+CONFIG_DIR: Path = Path("spd/clustering/configs")
+
 
 @pytest.mark.slow
 def test_cluster_resid_mlp_notebook():
     """Test running the cluster_resid_mlp.py notebook-style script."""
-    script_path = Path("spd/clustering/experiments/cluster_resid_mlp.py")
+    script_path = NOTEBOOK_DIR / "cluster_resid_mlp.py"
     assert script_path.exists(), f"Script not found: {script_path}"
 
     # Run the script as-is
@@ -30,7 +34,7 @@ def test_cluster_resid_mlp_notebook():
 @pytest.mark.slow
 def test_clustering_with_resid_mlp1_config():
     """Test running clustering with test-resid_mlp1.json config."""
-    config_path = Path("spd/clustering/configs/test-resid_mlp1.json")
+    config_path = CONFIG_DIR / "test-resid_mlp1.json"
     assert config_path.exists(), f"Config not found: {config_path}"
 
     # Run the clustering main script with the test config
@@ -54,7 +58,7 @@ def test_clustering_with_resid_mlp1_config():
 @pytest.mark.slow
 def test_cluster_ss_notebook():
     """Test running the cluster_ss.py notebook-style script."""
-    script_path = Path("spd/clustering/experiments/cluster_ss.py")
+    script_path = NOTEBOOK_DIR / "cluster_ss.py"
     assert script_path.exists(), f"Script not found: {script_path}"
 
     # Run the script as-is
@@ -74,7 +78,7 @@ def test_cluster_ss_notebook():
 @pytest.mark.slow
 def test_clustering_with_simplestories_config():
     """Test running clustering with test-simplestories.json config."""
-    config_path = Path("spd/clustering/configs/test-simplestories.json")
+    config_path = CONFIG_DIR / "test-simplestories.json"
     assert config_path.exists(), f"Config not found: {config_path}"
 
     # Run the clustering main script with the test config