Skip to content

Commit

Permalink
Rename EmbeddingDistance to EmbeddingSimilarity (#41)
Browse files Browse the repository at this point in the history
Forgot to do this before landing 🤦
  • Loading branch information
ankrgyl authored Dec 15, 2023
1 parent 8a00ce6 commit 31c0ee2
Show file tree
Hide file tree
Showing 4 changed files with 23 additions and 13 deletions.
6 changes: 3 additions & 3 deletions js/embeddings.test.ts
Original file line number Diff line number Diff line change
@@ -1,4 +1,4 @@
import { EmbeddingDistance } from "./string.js";
import { EmbeddingSimilarity } from "./string.js";

const SYNONYMS = [
{
Expand All @@ -25,7 +25,7 @@ test("Embeddings Test", async () => {
const prefix = "resource type: ";
for (const { word, synonyms } of SYNONYMS) {
for (const synonym of synonyms) {
const result = await EmbeddingDistance({
const result = await EmbeddingSimilarity({
prefix,
output: word,
expected: synonym,
Expand All @@ -42,7 +42,7 @@ test("Embeddings Test", async () => {

const word1 = UNRELATED[i];
const word2 = UNRELATED[j];
const result = await EmbeddingDistance({
const result = await EmbeddingSimilarity({
prefix,
output: word1,
expected: word2,
Expand Down
14 changes: 12 additions & 2 deletions js/string.ts
Original file line number Diff line number Diff line change
Expand Up @@ -28,7 +28,17 @@ export const LevenshteinScorer: Scorer<string, {}> = (args) => {
};
};

export const EmbeddingDistance: Scorer<
/**
* A scorer that uses cosine similarity to compare two strings.
*
* @param args
* @param args.prefix A prefix to prepend to the prompt. This is useful for specifying the domain of the inputs.
 * @param args.model The model to use for the embedding similarity. Defaults to "text-embedding-ada-002".
* @param args.expectedMin The minimum expected score. Defaults to 0.7. Values below this will be scored as 0, and
* values between this and 1 will be scaled linearly.
* @returns A score between 0 and 1, where 1 is a perfect match.
*/
export const EmbeddingSimilarity: Scorer<
string,
{
prefix?: string;
Expand All @@ -37,7 +47,7 @@ export const EmbeddingDistance: Scorer<
} & OpenAIAuth
> = async (args) => {
if (args.expected === undefined) {
throw new Error("EmbeddingDistance requires an expected value");
throw new Error("EmbeddingSimilarity requires an expected value");
}

const prefix = args.prefix ?? "";
Expand Down
12 changes: 6 additions & 6 deletions py/autoevals/string.py
Original file line number Diff line number Diff line change
Expand Up @@ -26,16 +26,16 @@ def _run_eval_sync(self, output, expected=None, **kwargs):
LevenshteinScorer = Levenshtein # backcompat


class EmbeddingDistance(Scorer):
class EmbeddingSimilarity(Scorer):
"""
A simple scorer that uses embedding distance to compare two strings.
A simple scorer that uses cosine similarity to compare two strings.
"""

MODEL = "text-embedding-ada-002"

def __init__(self, prefix="", model=MODEL, expected_min=0.7, api_key=None, base_url=None):
"""
Create a new EmbeddingDistance scorer.
Create a new EmbeddingSimilarity scorer.
:param prefix: A prefix to prepend to the prompt. This is useful for specifying the domain of the inputs.
:param model: The model to use for the embedding similarity. Defaults to "text-embedding-ada-002".
Expand All @@ -53,7 +53,7 @@ def __init__(self, prefix="", model=MODEL, expected_min=0.7, api_key=None, base_

async def _run_eval_async(self, output, expected=None, **kwargs):
if expected is None:
raise ValueError("EmbeddingDistance requires an expected value")
raise ValueError("EmbeddingSimilarity requires an expected value")

output_embedding_p = arun_cached_request(input=f"{self.prefix}{output}", **self.extra_args)
expected_embedding_p = arun_cached_request(input=f"{self.prefix}{expected}", **self.extra_args)
Expand All @@ -69,7 +69,7 @@ async def _run_eval_async(self, output, expected=None, **kwargs):

def _run_eval_sync(self, output, expected=None, **kwargs):
if expected is None:
raise ValueError("EmbeddingDistance requires an expected value")
raise ValueError("EmbeddingSimilarity requires an expected value")

output_result = run_cached_request("embed", input=f"{self.prefix}{output}", **self.extra_args)
expected_result = run_cached_request("embed", input=f"{self.prefix}{expected}", **self.extra_args)
Expand Down Expand Up @@ -104,4 +104,4 @@ def cosine_similarity(list1, list2):
return min(dot_product / (magnitude_list1 * magnitude_list2), 1)


__all__ = ["LevenshteinScorer", "Levenshtein", "EmbeddingDistance"]
__all__ = ["LevenshteinScorer", "Levenshtein", "EmbeddingSimilarity"]
4 changes: 2 additions & 2 deletions py/autoevals/test_embeddings.py
Original file line number Diff line number Diff line change
@@ -1,4 +1,4 @@
from autoevals import EmbeddingDistance
from autoevals import EmbeddingSimilarity

SYNONYMS = [
("water", ["water", "H2O", "agua"]),
Expand All @@ -10,7 +10,7 @@


def test_embeddings():
evaluator = EmbeddingDistance(prefix="resource type: ")
evaluator = EmbeddingSimilarity(prefix="resource type: ")
for word, synonyms in SYNONYMS:
for synonym in synonyms:
result = evaluator(word, synonym)
Expand Down

0 comments on commit 31c0ee2

Please sign in to comment.