From ae969bfadec6844d17c86284ab6a3afb19b8fa32 Mon Sep 17 00:00:00 2001
From: Farzad Abdolhosseini <farzad@fixie.ai>
Date: Wed, 19 Jul 2023 13:15:38 -0700
Subject: [PATCH] review comments + pulling changes from another PR

---
 .../src/batteries/constrained-output.tsx      | 67 ++++++++++++-------
 packages/ai-jsx/src/core/completion.tsx       | 10 ++-
 packages/ai-jsx/src/core/errors.ts            |  1 -
 packages/ai-jsx/src/lib/openai.tsx            |  5 +-
 packages/ai-jsx/src/lib/util.ts               |  7 ++
 .../examples/src/validated-generation.tsx     |  3 +-
 6 files changed, 59 insertions(+), 34 deletions(-)
diff --git a/packages/ai-jsx/src/batteries/constrained-output.tsx b/packages/ai-jsx/src/batteries/constrained-output.tsx
index 2b9ce4077..212851f35 100644
--- a/packages/ai-jsx/src/batteries/constrained-output.tsx
+++ b/packages/ai-jsx/src/batteries/constrained-output.tsx
@@ -13,10 +13,11 @@ import {
   ModelPropsWithChildren,
 } from '../core/completion.js';
 import yaml from 'js-yaml';
-import { AIJSXError, ErrorCode } from '../core/errors.js';
+import { AIJSXError, ErrorCode, ErrorBlame } from '../core/errors.js';
+import { Jsonifiable } from 'type-fest';
 import z from 'zod';
 import { zodToJsonSchema } from 'zod-to-json-schema';
-import untruncateJson from 'untruncate-json';
+import { patchedUntruncateJson } from '../lib/util.js';
 
 export type ObjectCompletion = ModelPropsWithChildren & {
   /** Validators are used to ensure that the final object looks as expected. */
@@ -27,6 +28,12 @@ export type ObjectCompletion = ModelPropsWithChildren & {
    *
    * @note To match OpenAI function definition specs, the schema must be a Zod object.
    * Arrays and other types should be wrapped in a top-level object in order to be used.
+   *
+   * For example, to describe a list of strings, the following is not accepted:
+   * `const schema: z.Schema = z.array(z.string())`
+   *
+   * Instead, you can wrap it in an object like so:
+   * `const schema: z.ZodObject = z.object({ arr: z.array(z.string()) })`
    */
   schema?: z.ZodObject<any>;
   /** Any output example to be shown to the model. */
@@ -88,13 +95,11 @@ export async function* JsonChatCompletion(
   { schema, ...props }: Omit<TypedObjectCompletionWithRetry, 'typeName' | 'parser' | 'partialResultCleaner'>,
   { render }: AI.ComponentContext
 ) {
-  if (schema) {
-    try {
-      return yield* render(<JsonChatCompletionFunctionCall schema={schema} {...props} />);
-    } catch (e: any) {
-      if (e.code !== ErrorCode.ChatModelDoesNotSupportFunctions) {
-        throw e;
-      }
+  try {
+    return yield* render(<JsonChatCompletionFunctionCall schema={schema ?? z.object({}).nonstrict()} {...props} />);
+  } catch (e: any) {
+    if (e.code !== ErrorCode.ChatModelDoesNotSupportFunctions) {
+      throw e;
     }
   }
   return yield* render(
@@ -102,8 +107,7 @@ export async function* JsonChatCompletion(
       {...props}
       typeName="JSON"
       parser={JSON.parse}
-      // TODO: can we remove .default?
-      partialResultCleaner={untruncateJson.default}
+      partialResultCleaner={patchedUntruncateJson}
     />
   );
 }
@@ -148,6 +152,16 @@ export async function* YamlChatCompletion(
   );
 }
 
+export class CompletionError extends AIJSXError {
+  constructor(
+    message: string,
+    public readonly blame: ErrorBlame,
+    public readonly metadata: Jsonifiable & { output: string; validationError: string }
+  ) {
+    super(message, ErrorCode.ModelOutputDidNotMatchConstraint, blame, metadata);
+  }
+}
+
 /**
  * A {@link ChatCompletion} component that constrains the output to be a valid object format (e.g. JSON/YAML).
  *
@@ -159,7 +173,7 @@ export async function* YamlChatCompletion(
  */
 async function* OneShotObjectCompletion(
   { children, typeName, validators, example, schema, parser, partialResultCleaner, ...props }: TypedObjectCompletion,
-  { render, logger }: AI.ComponentContext
+  { render }: AI.ComponentContext
 ) {
   // If a schema is provided, it is added to the list of validators as well as the prompt.
   const validatorsAndSchema = schema ? [schema.parse, ...(validators ?? [])] : validators ?? [];
@@ -170,9 +184,9 @@ async function* OneShotObjectCompletion(
       <SystemMessage>
         Respond with a {typeName} object that encodes your response.
         {schema
-          ? `The ${typeName} object should match this JSON Schema: ${JSON.stringify(zodToJsonSchema(schema))}`
+          ? `The ${typeName} object should match this JSON Schema: ${JSON.stringify(zodToJsonSchema(schema))}\n`
           : ''}
-        {example ? `For example: \n${example}` : ''}
+        {example ? `For example: ${example}\n` : ''}
         Respond with only the {typeName} object. Do not include any explanatory prose. Do not include ```
         {typeName.toLowerCase()} ``` code blocks.
       </SystemMessage>
@@ -191,11 +205,11 @@ async function* OneShotObjectCompletion(
       }
     } catch (e: any) {
       if (partial.done) {
-        logger.warn(
-          { output: partial.value, cleaned: partialResultCleaner ? str : undefined, errorMessage: e.message },
-          "ObjectCompletion failed. The final result either didn't parse or didn't validate."
-        );
-        throw e;
+        throw new CompletionError(`The model did not produce a valid ${typeName} object`, 'runtime', {
+          typeName,
+          output: partial.value,
+          validationError: e.message,
+        });
       }
       continue;
     }
@@ -230,7 +244,8 @@ async function* ObjectCompletionWithRetry(
     output = yield* render(childrenWithCompletion);
     return output;
   } catch (e: any) {
-    validationError = e.message;
+    validationError = e.metadata.validationError;
+    output = e.metadata.output;
   }
 
   logger.debug({ atempt: 1, expectedFormat: props.typeName, output }, `Output did not validate to ${props.typeName}.`);
@@ -244,9 +259,10 @@ async function* ObjectCompletionWithRetry(
         <AssistantMessage>{output}</AssistantMessage>
         <UserMessage>
           Try again. Here's the validation error when trying to parse the output as {props.typeName}:{'\n'}
+          ```log filename="error.log"{'\n'}
           {validationError}
-          {'\n'}
-          You must reformat the string to be a valid {props.typeName} object, but you must keep the same data.
+          {'\n```\n'}
+          You must reformat your previous output to be a valid {props.typeName} object, but you must keep the same data.
         </UserMessage>
       </OneShotObjectCompletion>
     );
@@ -255,7 +271,8 @@ async function* ObjectCompletionWithRetry(
       output = yield* render(completionRetry);
       return output;
     } catch (e: any) {
-      validationError = e.message;
+      validationError = e.metadata.validationError;
+      output = e.metadata.output;
     }
 
     logger.debug(
@@ -264,14 +281,14 @@ async function* ObjectCompletionWithRetry(
     );
   }
 
-  throw new AIJSXError(
+  throw new CompletionError(
     `The model did not produce a valid ${props.typeName} object, even after ${retries} attempts.`,
-    ErrorCode.ModelOutputDidNotMatchConstraint,
     'runtime',
     {
       typeName: props.typeName,
       retries,
       output,
+      validationError,
     }
   );
 }
diff --git a/packages/ai-jsx/src/core/completion.tsx b/packages/ai-jsx/src/core/completion.tsx
index 66d9d5850..f5f1e6d84 100644
--- a/packages/ai-jsx/src/core/completion.tsx
+++ b/packages/ai-jsx/src/core/completion.tsx
@@ -48,10 +48,8 @@ export interface FunctionDefinition {
 /**
  * This function creates a [JSON Schema](https://json-schema.org/) object to describe
  * parameters for a {@link FunctionDefinition}.
- * The parameters can be described either using a record of parameter names to
- * {@link PlainFunctionParameter} objects, or using a {@link z.ZodObject} schema object.
  *
- * @note If using a Zod schema, the top-level schema must be an object as per OpenAI specifications.
+ * See {@link FunctionParameters} for more information on what parameters are supported.
  */
 export function getParametersSchema(parameters: FunctionParameters) {
   if (parameters instanceof z.ZodObject) {
@@ -90,6 +88,12 @@ export interface PlainFunctionParameter {
  *
  * @note If using a Zod schema, the top-level schema must be an object as per OpenAI specifications:
  * https://platform.openai.com/docs/api-reference/chat/create#chat/create-parameters
+ *
+ * For example, to describe a list of strings, the following is not accepted:
+ * `const schema: z.Schema = z.array(z.string())`
+ *
+ * Instead, you can wrap it in an object like so:
+ * `const schema: z.ZodObject = z.object({ arr: z.array(z.string()) })`
  */
 export type FunctionParameters = Record<string, PlainFunctionParameter> | z.ZodObject<any>;
 
diff --git a/packages/ai-jsx/src/core/errors.ts b/packages/ai-jsx/src/core/errors.ts
index 386b671df..95d298aeb 100644
--- a/packages/ai-jsx/src/core/errors.ts
+++ b/packages/ai-jsx/src/core/errors.ts
@@ -26,7 +26,6 @@ export enum ErrorCode {
   AnthropicAPIError = 1021,
   ChatModelDoesNotSupportFunctions = 1022,
   ChatCompletionBadInput = 1023,
-  InvalidParamSchemaType = 1024,
 
   ModelOutputDidNotMatchConstraint = 2000,
 
diff --git a/packages/ai-jsx/src/lib/openai.tsx b/packages/ai-jsx/src/lib/openai.tsx
index ac3406915..555b85666 100644
--- a/packages/ai-jsx/src/lib/openai.tsx
+++ b/packages/ai-jsx/src/lib/openai.tsx
@@ -35,9 +35,8 @@ import GPT3Tokenizer from 'gpt3-tokenizer';
 import { Merge, MergeExclusive } from 'type-fest';
 import { Logger } from '../core/log.js';
 import { HttpError, AIJSXError, ErrorCode } from '../core/errors.js';
-import { getEnvVar } from './util.js';
+import { getEnvVar, patchedUntruncateJson } from './util.js';
 import { ChatOrCompletionModelOrBoth } from './model.js';
-import untruncateJson from 'untruncate-json';
 
 // https://platform.openai.com/docs/models/model-endpoint-compatibility
 type ValidCompletionModel =
@@ -437,7 +436,7 @@ export async function* OpenAIChatModel(
       if (props.experimental_streamFunctionCallOnly) {
         yield JSON.stringify({
           ...currentMessage.function_call,
-          arguments: JSON.parse(untruncateJson.default(currentMessage.function_call.arguments || '{}')),
+          arguments: JSON.parse(patchedUntruncateJson(currentMessage.function_call.arguments || '{}')),
         });
       }
     }
diff --git a/packages/ai-jsx/src/lib/util.ts b/packages/ai-jsx/src/lib/util.ts
index fa6b821ea..81ef9c6e1 100644
--- a/packages/ai-jsx/src/lib/util.ts
+++ b/packages/ai-jsx/src/lib/util.ts
@@ -1,3 +1,4 @@
+import untruncateJson from 'untruncate-json';
 import { AIJSXError } from '../core/errors.js';
 
 /** @hidden */
@@ -14,3 +15,9 @@ export function getEnvVar(name: string, shouldThrow: boolean = true) {
   }
   return result;
 }
+
+/**
+ * There's an ESM issue with untruncate-json, so we need to do this to support running on both client & server.
+ */
+/** @hidden */
+export const patchedUntruncateJson = 'default' in untruncateJson ? untruncateJson.default : untruncateJson;
diff --git a/packages/examples/src/validated-generation.tsx b/packages/examples/src/validated-generation.tsx
index a0486ccf0..1b6235ffa 100644
--- a/packages/examples/src/validated-generation.tsx
+++ b/packages/examples/src/validated-generation.tsx
@@ -32,5 +32,4 @@ function App() {
   );
 }
 
-// showInspector(<App />);
-console.log(await AI.createRenderContext().render(<App />));
+showInspector(<App />);