Skip to content

Commit c616c8d

Browse files
committed
Disable normalizer
1 parent 35ab164 commit c616c8d

3 files changed

Lines changed: 5 additions & 9 deletions

File tree

bergson/__main__.py

Lines changed: 0 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -132,12 +132,6 @@ class Trackstar:
132132
trackstar_cfg: TrackstarConfig
133133

134134
def execute(self):
135-
if self.index_cfg.normalizer != "none":
136-
print(
137-
"Warning: using a normalizer. We have been unable to validate"
138-
"normalizers in our ablations. Use at your own risk. "
139-
)
140-
141135
trackstar(
142136
self.index_cfg, self.score_cfg, self.preprocess_cfg, self.trackstar_cfg
143137
)

bergson/config.py

Lines changed: 4 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -160,8 +160,10 @@ class IndexConfig:
160160
processor_path: str = ""
161161
"""Path to a precomputed processor."""
162162

163-
normalizer: Literal["adafactor", "adam", "none"] = "none"
164-
"""Type of normalizer to use for the gradients."""
163+
normalizer: Literal["none"] = "none" # "adafactor", "adam",
164+
"""Type of normalizer to use for the gradients. We are disabling
165+
optimizers due to lack of empirical validation - contact Eleuther
166+
if you'd like to use them."""
165167

166168
skip_preconditioners: bool = False
167169
"""Whether to skip estimating preconditioner statistics"""

examples/exp_log.md

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -50,4 +50,4 @@ with lr schedule from double backwards, 1e-2
5050

5151
without weight decay
5252

53-
512 tok: LDS Spearman=0.9338
53+
512 tok: LDS Spearman=0.9338

0 commit comments

Comments
 (0)