Allow for toggling CV

EleutherAI · norabelrose · Apr 16, 2023 · Apr 4, 2023 · Apr 4, 2023 · Apr 4, 2023
commit f021404d66984a25f8f7a19d4af365bb69a44f82
diff --git a/elk/evaluation/evaluate.py b/elk/evaluation/evaluate.py
@@ -28,8 +28,7 @@ class Eval(Serializable):
  `elk.training.preprocessing.normalize()` for details.
  num_gpus: The number of GPUs to use. Defaults to -1, which means
  "use all available GPUs".
- skip_supervised: Whether to skip training the supervised classifier. Defaults to
- False.
+ skip_supervised: Whether to skip evaluation of the supervised classifier.
  debug: When in debug mode, a useful log file is saved to the memorably-named
  output directory. Defaults to False.
  """

diff --git a/elk/training/supervised.py b/elk/training/supervised.py
@@ -26,7 +26,7 @@ def evaluate_supervised(
  return assert_type(float, lr_auroc), assert_type(float, lr_acc)
 
 
-def train_supervised(data: dict[str, tuple], device: str) -> Classifier:
+def train_supervised(data: dict[str, tuple], device: str, cv: bool) -> Classifier:
  Xs, train_labels = [], []
 
  for x0, x1, labels, _ in data.values():
@@ -42,6 +42,9 @@ def train_supervised(data: dict[str, tuple], device: str) -> Classifier:
 
  X, train_labels = torch.cat(Xs), torch.cat(train_labels)
  lr_model = Classifier(X.shape[-1], device=device)
- lr_model.fit_cv(X, train_labels)
+ if cv:
+ lr_model.fit_cv(X, train_labels)
+ else:
+ lr_model.fit(X, train_labels)
 
  return lr_model
diff --git a/elk/training/train.py b/elk/training/train.py
@@ -3,7 +3,7 @@
 from dataclasses import dataclass
 from functools import partial
 from pathlib import Path
-from typing import Callable
+from typing import Callable, Literal
 
 import pandas as pd
 import torch
@@ -32,8 +32,9 @@ class Elicit(Serializable):
  "use all available GPUs".
  normalization: The normalization method to use. Defaults to "meanonly". See
  `elk.training.preprocessing.normalize()` for details.
- skip_supervised: Whether to skip training the supervised classifier. Defaults to
- False.
+ supervised: Whether and how to train a supervised classifier. "none" skips it,
+ "single" (the default) trains a single classifier on the training data, and
+ "cv" trains the classifier using cross-validation.
  debug: When in debug mode, a useful log file is saved to the memorably-named
  output directory. Defaults to False.
  """
@@ -49,7 +50,7 @@ class Elicit(Serializable):
  min_gpu_mem: int | None = None
  num_gpus: int = -1
  out_dir: Path | None = None
- skip_supervised: bool = False
+ supervised: Literal["none", "single", "cv"] = "single"
 
  def execute(self):
  train_run = Train(cfg=self, out_dir=self.out_dir)
@@ -116,8 +117,10 @@ def train_reporter(
  torch.save(reporter, file)
 
  # Fit supervised logistic regression model
- if not self.cfg.skip_supervised:
- lr_model = train_supervised(train_dict, device=device)
+ if self.cfg.supervised != "none":
+ lr_model = train_supervised(
+ train_dict, device=device, cv=self.cfg.supervised == "cv"
+ )
  with open(lr_dir / f"layer_{layer}.pt", "wb") as file:
  torch.save(lr_model, file)
  else: