Skip to content

Commit 726bb9e

Browse files
committed
fix(topk activation): add keepdim=True to enable broadcasting; make dtype consistent without hardcode
1 parent 5240735 commit 726bb9e

File tree

3 files changed

+3
-3
lines changed

3 files changed

+3
-3
lines changed

src/lm_saes/evaluator.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -4,11 +4,11 @@
 4  4   from torch import Tensor
 5  5   from tqdm import tqdm
 6  6   from transformer_lens import HookedTransformer
    7 + from wandb.sdk.wandb_run import Run
 7  8
 8  9   from lm_saes.config import EvalConfig, MixCoderConfig, SAEConfig
 9 10   from lm_saes.mixcoder import MixCoder
10 11   from lm_saes.sae import SparseAutoEncoder
11    - from wandb.sdk.wandb_run import Run
12 12
13 13
14 14   class Evaluator:

src/lm_saes/runner.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -2,11 +2,11 @@
 2  2   from pathlib import Path
 3  3   from typing import Literal, Optional, TypeVar, overload
 4  4
    5 + import wandb
 5  6   from pydantic import model_validator
 6  7   from pydantic_settings import BaseSettings, SettingsConfigDict
 7  8   from torch.distributed.device_mesh import init_device_mesh
 8  9
 9    - import wandb
10 10   from lm_saes.activation.factory import ActivationFactory
11 11   from lm_saes.activation.writer import ActivationWriter
12 12   from lm_saes.analysis.feature_analyzer import FeatureAnalyzer

src/lm_saes/trainer.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -7,11 +7,11 @@
 7  7   from torch import Tensor
 8  8   from torch.optim import Adam, Optimizer
 9  9   from tqdm import tqdm
   10 + from wandb.sdk.wandb_run import Run
10 11
11 12   from lm_saes.config import TrainerConfig
12 13   from lm_saes.optim import get_scheduler
13 14   from lm_saes.sae import SparseAutoEncoder
14    - from wandb.sdk.wandb_run import Run
15 15
16 16
17 17   class Trainer:

0 commit comments

Comments
 (0)