openai · jwang47 · Apr 12, 2023 · Apr 12, 2023 · Apr 12, 2023 · Apr 12, 2023
@@ -13,12 +13,14 @@ def __init__(
  self,
  completion_fns: list[CompletionFn],
  samples_jsonl: str,
+ ignore_case: bool = False,
  *args,
  **kwargs,
  ):
  super().__init__(completion_fns, *args, **kwargs)
  assert len(completion_fns) == 1, "Includes only supports one completion fn"
  self.samples_jsonl = samples_jsonl
+ self.ignore_case = ignore_case
 
  def eval_sample(self, sample: Any, *_):
  prompt = sample["input"]
@@ -27,7 +29,9 @@ def eval_sample(self, sample: Any, *_):
  )
  sampled = result.get_completions()[0]
 
- includes_answer = any([utils.get_answer(sampled, ref) for ref in sample["ideal"]])
+ includes_answer = any(
+ [utils.get_answer(sampled, ref, self.ignore_case) for ref in sample["ideal"]]
+ )
  evals.record.record_metrics(accuracy=float(includes_answer))
  return includes_answer
 

@@ -14,8 +14,12 @@
 )
 
 
def get_answer(text, answer_prompt, ignore_case=False):
    """Return the part of ``text`` that follows the last ``answer_prompt``.

    Args:
        text: String to search.
        answer_prompt: Marker to look for; the last occurrence is used.
        ignore_case: When true, the marker is matched without regard to case.

    Returns:
        Everything in ``text`` after the last occurrence of ``answer_prompt``
        (this may be an empty string when the marker ends the text), or
        ``None`` when the marker does not occur.
    """
    if not ignore_case:
        idx = text.rfind(answer_prompt)
    else:
        lowered_text = text.lower()
        lowered_prompt = answer_prompt.lower()
        if len(lowered_text) == len(text) and len(lowered_prompt) == len(answer_prompt):
            # Every character lowercases to at least one character, so equal
            # lengths mean positions in the lowered text line up with ``text``.
            idx = lowered_text.rfind(lowered_prompt)
        else:
            # Lowercasing changed a length (e.g. U+0130 becomes two code
            # points), so an index into the lowered text would be wrong for
            # ``text``. Scan the original string from the right instead.
            width = len(answer_prompt)
            idx = next(
                (
                    start
                    for start in range(len(text) - width, -1, -1)
                    if text[start : start + width].lower() == lowered_prompt
                ),
                -1,
            )

    if idx == -1:
        return None
    return text[idx + len(answer_prompt) :]

@@ -3,6 +3,7 @@ test:
  - test-match
  - test-fuzzy-match
  - test-includes
+ - test-includes-ignore-case
  - coqa-match
  - coqa-fact
  - coqa-fact-expl

@@ -3,3 +3,4 @@ test-basic:
  - test-match
  - test-fuzzy-match
  - test-includes
+ - test-includes-ignore-case
@@ -25,3 +25,13 @@ test-includes.s1.simple-v0:
  class: evals.elsuite.basic.includes:Includes
  args:
  samples_jsonl: test_fuzzy_match/samples.jsonl
+
+test-includes-ignore-case:
+ id: test-includes-ignore-case.s1.simple-v0
+ description: Example eval that checks whether the completion includes the ideal answer, ignoring case.
+ metrics: [accuracy]
+test-includes-ignore-case.s1.simple-v0:
+ class: evals.elsuite.basic.includes:Includes
+ args:
+ samples_jsonl: test_fuzzy_match/samples.jsonl
+ ignore_case: true