Add --no_balance flag to not balance datasets #287

Open · wants to merge 4 commits into base: main
3 changes: 3 additions & 0 deletions elk/debug_logging.py
@@ -31,6 +31,9 @@ def save_debug_log(datasets: list[DatasetDictWithName], out_dir: Path) -> None:
         else:
             train_split, val_split = select_train_val_splits(ds)

+        if len(ds[val_split]) == 0:
+            logging.warning(f"Val split '{val_split}' is empty!")
+            continue
         text_questions = ds[val_split][0]["text_questions"]
         template_ids = ds[val_split][0]["variant_ids"]
         label = ds[val_split][0]["label"]
4 changes: 4 additions & 0 deletions elk/extraction/extraction.py
@@ -65,6 +65,9 @@ class Extract(Serializable):
     binarize: bool = False
     """Whether to binarize the dataset labels for multi-class datasets."""

+    no_balance: bool = False
+    """Whether to disable balancing the dataset by label."""
+
     int8: bool = False
     """Whether to perform inference in mixed int8 precision with `bitsandbytes`."""

Review thread on `no_balance: bool = False`:

Collaborator: Why not just make it `balance: bool = True`?

Collaborator: That would also avoid having that: `balance=not cfg.no_balance`

Collaborator (Author): Because it would be unclear how to use the flag to disable balancing from the CLI. `--balance False` or something is weirder than `--no_balance`.

Collaborator: `--balance False` does not seem weirder than `--no_balance True` to me. But okay, it's fine by me.

Collaborator (Author): Yeah, I think I agree with you now.

@@ -189,6 +192,7 @@ def extract_hiddens(
         num_shots=cfg.num_shots,
         split_type=split_type,
         template_path=cfg.template_path,
+        balance=not cfg.no_balance,
         rank=rank,
         world_size=world_size,
         seed=cfg.seed,
5 changes: 3 additions & 2 deletions elk/extraction/prompt_loading.py
@@ -21,6 +21,7 @@ def load_prompts(
     seed: int = 42,
     split_type: Literal["train", "val"] = "train",
     template_path: str | None = None,
+    balance: bool = True,
     rank: int = 0,
     world_size: int = 1,
 ) -> Iterator[dict]:
@@ -89,14 +90,14 @@
     else:
         fewshot_iter = None

-    if label_column in ds.features:
+    if label_column in ds.features and balance:
         ds = BalancedSampler(
             ds.to_iterable_dataset(),
             set(label_choices),
             label_col=label_column,
         )
     else:
-        if rank == 0:
+        if rank == 0 and balance:
             print("No label column found, not balancing")
         ds = ds.to_iterable_dataset()
9 changes: 4 additions & 5 deletions elk/training/classifier.py
@@ -194,8 +194,8 @@ def inlp(
             the input dimension.
         y: Target tensor of shape (N,) for binary classification or (N, C) for
             multiclass classification, where C is the number of classes.
-        max_iter: Maximum number of iterations to run. If `None`, run for the full
-            dimension of the input.
+        max_iter: Maximum number of iterations to run. If `None`, run until the data
+            is linearly guarded (no linear classifier can extract information).
         tol: Tolerance for the loss function. The algorithm will stop when the loss
             is within `tol` of the entropy of the labels.

@@ -212,12 +212,11 @@
         p = y.float().mean()
         H = -p * torch.log(p) - (1 - p) * torch.log(1 - p)

-        if max_iter is not None:
-            d = min(d, max_iter)
+        max_iter = max_iter or d

         # Iterate until the loss is within epsilon of the entropy
         result = InlpResult()
-        for _ in range(d):
+        for _ in range(max_iter):
             clf = cls(d, device=x.device, dtype=x.dtype)
             loss = clf.fit(x, y)
             result.classifiers.append(clf)

Review thread on `max_iter = max_iter or d`:

Collaborator: That's just some refactoring which has nothing to do with the balancing, I guess?

Collaborator (Author): Right, I also added a max_iter flag and this was a necessary refactoring.
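For context on what this loop does: INLP (Iterative Nullspace Projection) repeatedly fits a linear probe and projects the data onto the nullspace of the probe's weight vector, stopping once the iteration budget runs out or the probe's loss is within `tol` of the label entropy, i.e. the probe does no better than chance. A self-contained sketch of the binary case, using a plain logistic probe as a toy stand-in for elk's `Classifier` (not its actual API):

```python
# Sketch of binary INLP; illustrative, not Classifier.inlp itself.
import torch
import torch.nn.functional as F

def fit_probe(x: torch.Tensor, y: torch.Tensor, steps: int = 200, lr: float = 0.1):
    """Fit a logistic probe by gradient descent; return (weights, loss)."""
    w = torch.zeros(x.shape[1], requires_grad=True)
    opt = torch.optim.SGD([w], lr=lr)
    for _ in range(steps):
        opt.zero_grad()
        loss = F.binary_cross_entropy_with_logits(x @ w, y.float())
        loss.backward()
        opt.step()
    return w.detach(), loss.detach()

def inlp_sketch(x, y, max_iter: int | None = None, tol: float = 0.01):
    d = x.shape[1]
    max_iter = max_iter or d  # same default as the refactored code above
    p = y.float().mean()
    entropy = -p * torch.log(p) - (1 - p) * torch.log(1 - p)
    for _ in range(max_iter):
        w, loss = fit_probe(x, y)
        if loss >= entropy - tol:
            break  # probe is at chance: the data is linearly guarded
        u = w / w.norm()
        # Remove the probe's direction: project x onto the nullspace of w.
        x = x - (x @ u).unsqueeze(-1) * u
    return x
```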
4 changes: 2 additions & 2 deletions elk/training/supervised.py
@@ -6,7 +6,7 @@


 def train_supervised(
-    data: dict[str, tuple], device: str, mode: str
+    data: dict[str, tuple], device: str, mode: str, max_inlp_iter: int | None = None
 ) -> list[Classifier]:
     Xs, train_labels = [], []

Review thread on the new `max_inlp_iter` parameter:

Collaborator: That's a new feature not related to the balancing either, right?
@@ -26,7 +26,7 @@ def train_supervised(
         lr_model.fit_cv(X, train_labels)
         return [lr_model]
     elif mode == "inlp":
-        return Classifier.inlp(X, train_labels).classifiers
+        return Classifier.inlp(X, train_labels, max_inlp_iter).classifiers
     elif mode == "single":
         lr_model = Classifier(X.shape[-1], device=device)
         lr_model.fit(X, train_labels)
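A direct call mirroring how train.py (below) threads the argument through would look like `train_supervised(train_dict, device="cuda:0", mode="inlp", max_inlp_iter=10)`; passing `max_inlp_iter=None` keeps the previous behavior of iterating up to the full input dimension. (Hypothetical usage, for illustration.)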
4 changes: 4 additions & 0 deletions elk/training/train.py
@@ -34,6 +34,9 @@ class Elicit(Run):
     cross-validation. Defaults to "single", which means to train a single classifier
     on the training data. "cv" means to use cross-validation."""

+    max_inlp_iter: int | None = None
+    """Maximum number of iterations for Iterative Nullspace Projection (INLP)."""
+
     def create_models_dir(self, out_dir: Path):
         lr_dir = None
         lr_dir = out_dir / "lr_models"
@@ -124,6 +127,7 @@ def apply_to_layer(
                 train_dict,
                 device=device,
                 mode=self.supervised,
+                max_inlp_iter=self.max_inlp_iter,
             )
             with open(lr_dir / f"layer_{layer}.pt", "wb") as file:
                 torch.save(lr_models, file)
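Assuming config fields map one-to-one onto CLI flags (as the reviewers' `--no_balance True` example above suggests), a run exercising both features in this PR might look like `elk elicit <model> <dataset> --no_balance True --supervised inlp --max_inlp_iter 10`; the exact invocation depends on elk's CLI wiring.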