From 235a9c5389de281438d2fc5f4a21081cddf3ec09 Mon Sep 17 00:00:00 2001
From: Damien BUTY
Date: Thu, 11 Jul 2024 19:31:20 +0200
Subject: [PATCH 1/3] feat(instrumentation): make the openai instrumentation
 context-aware

---
 src/api.ts                       | 106 ++++----
 src/instrumentation/index.ts     |  15 +-
 src/instrumentation/openai.ts    | 144 +++++------
 tests/integration/openai.test.ts | 408 +++++++++++++++++++++++--------
 4 files changed, 435 insertions(+), 238 deletions(-)

diff --git a/src/api.ts b/src/api.ts
index 13bed68..44e9761 100644
--- a/src/api.ts
+++ b/src/api.ts
@@ -696,70 +696,60 @@ export class API {
     orderBy?: GenerationsOrderBy;
   }): Promise<PaginatedResponse<PersistedGeneration>> {
     const query = `
-    query GetGenerations(
-      $after: ID,
-      $before: ID,
-      $cursorAnchor: DateTime,
-      $filters: [generationsInputType!],
-      $orderBy: GenerationsOrderByInput,
-      $first: Int,
-      $last: Int,
-      $projectId: String,
+      query GetGenerations(
+        $after: ID
+        $before: ID
+        $cursorAnchor: DateTime
+        $filters: [generationsInputType!]
+        $orderBy: GenerationsOrderByInput
+        $first: Int
+        $last: Int
+        $projectId: String
       ) {
-      generations(
-        after: $after,
-        before: $before,
-        cursorAnchor: $cursorAnchor,
-        filters: $filters,
-        orderBy: $orderBy,
-        first: $first,
-        last: $last,
-        projectId: $projectId,
-      ) {
+        generations(
+          after: $after
+          before: $before
+          cursorAnchor: $cursorAnchor
+          filters: $filters
+          orderBy: $orderBy
+          first: $first
+          last: $last
+          projectId: $projectId
+        ) {
         pageInfo {
-          startCursor
-          endCursor
-          hasNextPage
-          hasPreviousPage
+            startCursor
+            endCursor
+            hasNextPage
+            hasPreviousPage
         }
         totalCount
         edges {
-          cursor
-          node {
-            id
-            projectId
-            prompt
-            completion
-            createdAt
-            provider
-            model
-            variables
-            messages
-            messageCompletion
-            tools
-            settings
-            stepId
-            tokenCount
-            duration
-            inputTokenCount
-            outputTokenCount
-            ttFirstToken
-            duration
-            tokenThroughputInSeconds
-            error
-            type
-            tags
-            step {
-              threadId
-              thread {
-                participant {
-                  identifier
-                }
-              }
-            }
-          }
-        }
+            cursor
+            node {
+              id
+              projectId
+              prompt
+              completion
+              createdAt
+              provider
+              model
+              variables
+              messages
+              messageCompletion
+              tools
+              settings
+              tokenCount
+              duration
+              inputTokenCount
+              outputTokenCount
+              ttFirstToken
+              tokenThroughputInSeconds
+              error
+              type
+              tags
+            }
+          }
       }
+      }
     }`;
 
     const result = await this.makeGqlCall(query, variables);
diff --git a/src/instrumentation/index.ts b/src/instrumentation/index.ts
index 6308d09..526bb2f 100644
--- a/src/instrumentation/index.ts
+++ b/src/instrumentation/index.ts
@@ -1,20 +1,15 @@
-import { LiteralClient, Step, Thread } from '..';
+import { LiteralClient } from '..';
 
 import { LiteralCallbackHandler } from './langchain';
 import { instrumentLlamaIndex, withThread } from './llamaindex';
-import instrumentOpenAI, {
-  InstrumentOpenAIOptions,
-  OpenAIOutput
-} from './openai';
+import instrumentOpenAI from './openai';
+import { InstrumentOpenAIOptions } from './openai';
 import { makeInstrumentVercelSDK } from './vercel-sdk';
 
 export type { InstrumentOpenAIOptions } from './openai';
 
 export default (client: LiteralClient) => ({
-  openai: (
-    output: OpenAIOutput,
-    parent?: Step | Thread,
-    options?: InstrumentOpenAIOptions
-  ) => instrumentOpenAI(client, output, parent, options),
+  openai: (options?: InstrumentOpenAIOptions) =>
+    instrumentOpenAI(client, options),
   langchain: {
    literalCallback: (threadId?: string) => {
      try {
diff --git a/src/instrumentation/openai.ts b/src/instrumentation/openai.ts
index 6bdce4f..b664527 100644
--- a/src/instrumentation/openai.ts
+++ b/src/instrumentation/openai.ts
@@ -18,26 +18,14 @@ import {
   Thread
 } from '..';
 
-const openaiReqs: Record<
-  string,
-  {
-    // Record the ID of the request
-    id: string;
-    // Record the start time of the request
-    start: number;
-    // Record the inputs of the request
-    inputs: Record<string, any>;
-    // Record the stream of the request if it's a streaming request
-    stream?: Stream<ChatCompletionChunk>;
-  }
-> = {};
-
 // Define a generic type for the original function to be wrapped
 type OriginalFunction<T extends any[], R> = (...args: T) => Promise<R>;
 
 // Utility function to wrap a method
 function wrapFunction<T extends any[], R>(
-  originalFunction: OriginalFunction<T, R>
+  originalFunction: OriginalFunction<T, R>,
+  client: LiteralClient,
+  options: InstrumentOpenAIOptions = {}
 ): OriginalFunction<T, R> {
   return async function (this: any, ...args: T): Promise<R> {
     const start = Date.now();
@@ -46,58 +34,57 @@ function wrapFunction<T extends any[], R>(
     const result = await originalFunction.apply(this, args);
 
     if (result instanceof Stream) {
-      const streamResult = result as Stream<ChatCompletionChunk>;
-      // If it is a streaming request, we need to process the first token to get the id
-      // However we also need to tee the stream so that the end developer can process the stream
-      const [a, b] = streamResult.tee();
-      // Re split the stream to store a clean instance for final processing later on
-      const c = a.tee()[0];
-      let id;
-      // Iterate over the stream to find the first chunk and store the id
-      for await (const chunk of a) {
-        id = chunk.id;
-        if (!openaiReqs[id]) {
-          openaiReqs[id] = {
-            id,
-            inputs: args[0],
-            start,
-            stream: c
-          };
-          break;
-        }
-      }
-      // @ts-expect-error Hacky way to add the id to the stream
-      b.id = id;
+      const streamResult = result;
+      const [returnedResult, processedResult] = streamResult.tee();
 
-      return b as any;
+      await processOpenAIOutput(client, processedResult, {
+        ...options,
+        start,
+        inputs: args[0]
+      });
+
+      return returnedResult as R;
     } else {
-      const regularResult = result as ChatCompletion | Completion;
-      const id = regularResult.id;
-      openaiReqs[id] = {
-        id,
-        inputs: args[0],
-        start
-      };
+      await processOpenAIOutput(client, result as ChatCompletion | Completion, {
+        ...options,
+        start,
+        inputs: args[0]
+      });
+
       return result;
     }
   };
 }
 
-// Patching the chat.completions.create function
-const originalChatCompletionsCreate = OpenAI.Chat.Completions.prototype.create;
-OpenAI.Chat.Completions.prototype.create = wrapFunction(
-  originalChatCompletionsCreate
-) as any;
-
-// Patching the completions.create function
-const originalCompletionsCreate = OpenAI.Completions.prototype.create;
-OpenAI.Completions.prototype.create = wrapFunction(
-  originalCompletionsCreate
-) as any;
-
-// Patching the completions.create function
-const originalImagesGenerate = OpenAI.Images.prototype.generate;
-OpenAI.Images.prototype.generate = wrapFunction(originalImagesGenerate) as any;
+function instrumentOpenAI(
+  client: LiteralClient,
+  options: InstrumentOpenAIOptions = {}
+) {
+  // Patching the chat.completions.create function
+  const originalChatCompletionsCreate =
+    OpenAI.Chat.Completions.prototype.create;
+  OpenAI.Chat.Completions.prototype.create = wrapFunction(
+    originalChatCompletionsCreate,
+    client,
+    options
+  ) as any;
+
+  // Patching the completions.create function
+  const originalCompletionsCreate = OpenAI.Completions.prototype.create;
+  OpenAI.Completions.prototype.create = wrapFunction(
+    originalCompletionsCreate,
+    client,
+    options
+  ) as any;
+
+  // Patching the completions.create function
+  const originalImagesGenerate = OpenAI.Images.prototype.generate;
+  OpenAI.Images.prototype.generate = wrapFunction(
+    originalImagesGenerate,
+    client,
+    options
+  ) as any;
+}
 
 function processChatDelta(
   newDelta: ChatCompletionChunk.Choice.Delta,
@@ -296,22 +283,39 @@ export interface InstrumentOpenAIOptions {
   tags?: Maybe<string[]>;
 }
 
-const instrumentOpenAI = async (
+export interface ProcessOpenAIOutput extends InstrumentOpenAIOptions {
+  start: number;
+  inputs: Record<string, any>;
+}
+
+const processOpenAIOutput = async (
   client: LiteralClient,
   output: OpenAIOutput,
-  parent?: Step | Thread,
-  options: InstrumentOpenAIOptions = {}
+  { start, tags, inputs }: ProcessOpenAIOutput
 ) => {
-  //@ts-expect-error - This is a hacky way to get the id from the stream
-  const outputId = output.id;
-  const { stream, start, inputs } = openaiReqs[outputId];
   const baseGeneration = {
     provider: 'openai',
     model: inputs.model,
    settings: getSettings(inputs),
-    tags: options.tags
+    tags: tags
   };
 
+  let threadFromStore: Thread | null = null;
+  try {
+    threadFromStore = client.getCurrentThread();
+  } catch (error) {
+    // Ignore error thrown if getCurrentThread is called outside of a context
+  }
+
+  let stepFromStore: Step | null = null;
+  try {
+    stepFromStore = client.getCurrentStep();
+  } catch (error) {
+    // Ignore error thrown if getCurrentStep is called outside of a context
+  }
+
+  const parent = stepFromStore || threadFromStore;
+
   if ('data' in output) {
     // Image Generation
 
@@ -322,7 +326,7 @@ const processOpenAIOutput = async (
       output: output,
       startTime: new Date(start).toISOString(),
       endTime: new Date().toISOString(),
-      tags: options.tags
+      tags: tags
     };
 
     const step = parent
@@ -330,6 +334,8 @@ const processOpenAIOutput = async (
       : client.step({ ...stepData, type: 'run' });
     await step.send();
   } else if (output instanceof Stream) {
+    const stream = output as Stream<ChatCompletionChunk | Completion>;
+
     if (!stream) {
       throw new Error('Stream not found');
     }
@@ -460,8 +466,6 @@ const processOpenAIOutput = async (
       }
     }
   }
-
-  delete openaiReqs[outputId];
 };
 
 export default instrumentOpenAI;
diff --git a/tests/integration/openai.test.ts b/tests/integration/openai.test.ts
index a7231cf..25a0b89 100644
--- a/tests/integration/openai.test.ts
+++ b/tests/integration/openai.test.ts
@@ -1,130 +1,338 @@
 import 'dotenv/config';
 import OpenAI from 'openai';
+import { v4 as uuidv4 } from 'uuid';
 
-import { LiteralClient } from '../../src';
+import {
+  ChatGeneration,
+  LiteralClient,
+  Maybe,
+  OmitUtils,
+  Step
+} from '../../src';
+
+const url = process.env.LITERAL_API_URL;
+const apiKey = process.env.LITERAL_API_KEY;
+
+if (!url || !apiKey) {
+  throw new Error('Missing environment variables');
+}
+
+const openai = new OpenAI();
 
-// Skip for the CI
-describe.skip('OpenAI Instrumentation', () => {
-  let client: LiteralClient;
+describe('OpenAI Instrumentation', () => {
+  beforeAll(function () {});
 
-  beforeAll(function () {
-    const url = process.env.LITERAL_API_URL;
-    const apiKey = process.env.LITERAL_API_KEY;
+  describe('Outside of a thread or step wrapper', () => {
+    describe('Simple chat generation', () => {
+      let step: Maybe<Step>;
+      let generationFromStep: OmitUtils<ChatGeneration>;
+      let response: OpenAI.ChatCompletion;
 
-    if (!url || !apiKey) {
-      throw new Error('Missing environment variables');
-    }
+      beforeAll(async () => {
+        const testId = uuidv4();
 
-    client = new LiteralClient(apiKey, url);
-  });
+        const client = new LiteralClient(apiKey, url);
+        client.instrumentation.openai({ tags: [testId] });
+
+        response = await openai.chat.completions.create({
+          model: 'gpt-3.5-turbo',
+          messages: [
+            { role: 'system', content: 'You are a helpful assistant.' },
+            { role: 'user', content: 'What is the capital of Canada?' }
+          ]
+        });
 
-  it('should monitor simple generation', async () => {
-    const spy = jest.spyOn(client.api, 'createGeneration');
+        const {
+          data: [generation]
+        } = await client.api.getGenerations({
+          filters: [
+            {
+              field: 'tags',
+              operator: 'in',
+              value: [testId]
+            }
+          ]
+        });
 
-    const openai = new OpenAI();
+        step = await client.api.getStep(generation.id);
+        generationFromStep = step!.generation!;
+      });
 
-    const response = await openai.chat.completions.create({
-      model: 'gpt-3.5-turbo',
-      messages: [
-        { role: 'system', content: 'You are a helpful assistant.' },
-        { role: 'user', content: 'What is the capital of Canada?' }
-      ]
-    });
+      it('should create a generation with no thread or parent', async () => {
+        expect(step?.threadId).toBeNull();
+        expect(step?.parentId).toBeNull();
+        expect(step?.type).toBe('llm');
+      });
 
-    await client.instrumentation.openai(response);
-
-    expect(response.choices[0].message.content).toBeTruthy();
-
-    expect(spy).toHaveBeenCalledWith(
-      expect.objectContaining({
-        type: 'CHAT',
-        provider: 'openai',
-        model: 'gpt-3.5-turbo-0125',
-        messages: [
-          { content: 'You are a helpful assistant.', role: 'system' },
-          { content: 'What is the capital of Canada?', role: 'user' }
-        ],
-        messageCompletion: response.choices[0].message,
-        tokenCount: expect.any(Number)
-      })
-    );
-  });
+      it("should log a generation's input & output", async () => {
+        expect(generationFromStep.messages).toEqual([
+          {
+            role: 'system',
+            content: 'You are a helpful assistant.'
+          },
+          {
+            role: 'user',
+            content: 'What is the capital of Canada?'
+          }
+        ]);
+        expect(generationFromStep.messageCompletion).toEqual({
+          role: 'assistant',
+          content: response.choices[0].message.content
+        });
+      });
+
+      it("should log a generation's settings", async () => {
+        expect(generationFromStep.provider).toBe('openai');
+        expect(generationFromStep.model).toContain('gpt-3.5-turbo');
+        expect(generationFromStep.tokenCount).toEqual(expect.any(Number));
+        expect(generationFromStep.inputTokenCount).toEqual(expect.any(Number));
+        expect(generationFromStep.outputTokenCount).toEqual(expect.any(Number));
+      });
+    });
 
-  it('should monitor streamed generation', async () => {
-    const spy = jest.spyOn(client.api, 'createGeneration');
+    describe('Streamed chat generation', () => {
+      let step: Maybe<Step>;
+      let generationFromStep: OmitUtils<ChatGeneration>;
+      let resultText = '';
 
-    const openai = new OpenAI();
+      beforeAll(async () => {
+        const testId = uuidv4();
 
-    const response = await openai.chat.completions.create({
-      model: 'gpt-3.5-turbo',
-      messages: [
-        { role: 'system', content: 'You are a helpful assistant.' },
-        { role: 'user', content: 'What is the capital of Switzerland?' }
-      ],
-      stream: true
-    });
+        const client = new LiteralClient(apiKey, url);
+        client.instrumentation.openai({ tags: [testId] });
+
+        const response = await openai.chat.completions.create({
+          model: 'gpt-3.5-turbo',
+          messages: [
+            { role: 'system', content: 'You are a helpful assistant.' },
+            { role: 'user', content: 'What is the capital of Canada?' }
+          ],
+          stream: true
+        });
+
+        const {
+          data: [generation]
+        } = await client.api.getGenerations({
+          filters: [
+            {
+              field: 'tags',
+              operator: 'in',
+              value: [testId]
+            }
+          ]
+        });
+
+        for await (const chunk of response) {
+          resultText += chunk.choices[0].delta.content ?? '';
+        }
+
+        step = await client.api.getStep(generation.id);
+        generationFromStep = step!.generation!;
+      });
+
+      it('should create a generation with no thread or parent', async () => {
+        expect(step?.threadId).toBeNull();
+        expect(step?.parentId).toBeNull();
+        expect(step?.type).toBe('llm');
+      });
 
-    await client.instrumentation.openai(response);
-
-    let resultText = '';
-    // use stream as an async iterable:
-    for await (const chunk of response) {
-      resultText += chunk.choices[0].delta.content ?? '';
-    }
-
-    expect(resultText).toBeTruthy();
-
-    expect(spy).toHaveBeenCalledWith(
-      expect.objectContaining({
-        type: 'CHAT',
-        provider: 'openai',
-        model: 'gpt-3.5-turbo-0125',
-        messages: [
-          { content: 'You are a helpful assistant.', role: 'system' },
-          { content: 'What is the capital of Switzerland?', role: 'user' }
-        ],
-        messageCompletion: {
+      it("should log a generation's input & output", async () => {
+        expect(generationFromStep.messages).toEqual([
+          {
+            role: 'system',
+            content: 'You are a helpful assistant.'
+          },
+          {
+            role: 'user',
+            content: 'What is the capital of Canada?'
+          }
+        ]);
+        expect(generationFromStep.messageCompletion).toEqual({
           role: 'assistant',
           content: resultText
-        },
-        duration: expect.any(Number),
-        ttFirstToken: expect.any(Number),
-        outputTokenCount: expect.any(Number),
-        tokenThroughputInSeconds: expect.any(Number)
-      })
-    );
+        });
+      });
+
+      it("should log a generation's settings", async () => {
+        expect(generationFromStep.provider).toBe('openai');
+        expect(generationFromStep.model).toContain('gpt-3.5-turbo');
+        expect(generationFromStep.tokenCount).toEqual(expect.any(Number));
+        expect(generationFromStep.inputTokenCount).toEqual(expect.any(Number));
+        expect(generationFromStep.outputTokenCount).toEqual(expect.any(Number));
+      });
+    });
+
+    describe('Image generation', () => {
+      it('should monitor image generation', async () => {
+        const testId = uuidv4();
+
+        const client = new LiteralClient(apiKey, url);
+        client.instrumentation.openai({ tags: [testId] });
+
+        const response = await openai.images.generate({
+          prompt: 'A painting of a rose in the style of Picasso.',
+          model: 'dall-e-2',
+          size: '256x256',
+          n: 1
+        });
+
+        const {
+          data: [step]
+        } = await client.api.getSteps({
+          first: 1,
+          filters: [
+            {
+              field: 'tags',
+              operator: 'in',
+              value: [testId]
+            }
+          ]
+        });
+
+        expect(step?.threadId).toBeNull();
+        expect(step?.parentId).toBeNull();
+        expect(step?.type).toBe('run');
+
+        expect(step?.output?.data[0].url).toEqual(response.data[0].url);
+      }, 30000);
+    });
   });
 
-  it('should monitor image generation', async () => {
-    const spy = jest.spyOn(client.api, 'sendSteps');
+  describe('Inside of a thread or step wrapper', () => {
+    it('logs the generation inside its thread and parent', async () => {
+      const testId = uuidv4();
+
+      const client = new LiteralClient(apiKey, url);
+      client.instrumentation.openai({ tags: [testId] });
+
+      let threadId: Maybe<string>;
+      let parentId: Maybe<string>;
+
+      await client.thread({ name: 'openai' }).wrap(async () => {
+        threadId = client.getCurrentThread().id;
+        return client.run({ name: 'openai' }).wrap(async () => {
+          parentId = client.getCurrentStep().id;
 
-    const openai = new OpenAI();
+          await openai.chat.completions.create({
+            model: 'gpt-3.5-turbo',
+            messages: [
+              { role: 'system', content: 'You are a helpful assistant.' },
+              { role: 'user', content: 'What is the capital of Canada?' }
+            ]
+          });
+        });
+      });
 
-    const response = await openai.images.generate({
-      prompt: 'A painting of a rose in the style of Picasso.',
-      model: 'dall-e-2',
-      size: '256x256',
-      n: 1
-    });
+      const {
+        data: [step]
+      } = await client.api.getSteps({
+        first: 1,
+        filters: [
+          {
+            field: 'tags',
+            operator: 'in',
+            value: [testId]
+          }
+        ]
+      });
 
-    await client.instrumentation.openai(response);
+      expect(step?.threadId).toBe(threadId);
+      expect(step?.parentId).toBe(parentId);
    });
 
-    expect(response.data[0].url).toBeTruthy();
+    it("doesn't mix up threads and steps", async () => {
+      const testId = uuidv4();
 
-    expect(spy).toHaveBeenCalledWith(
-      expect.arrayContaining([
-        expect.objectContaining({
-          name: 'dall-e-2',
-          type: 'run',
-          input: {
-            model: 'dall-e-2',
-            prompt: 'A painting of a rose in the style of Picasso.',
-            size: '256x256',
-            n: 1
-          },
-          output: response
-        })
-      ])
-    );
+      const client = new LiteralClient(apiKey, url);
+      client.instrumentation.openai({ tags: [testId] });
+
+      const firstThreadId = uuidv4();
+      const secondThreadId = uuidv4();
+
+      let firstStep: Maybe<Step>;
+      let secondStep: Maybe<Step>;
+
+      await Promise.all([
+        client
+          .thread({ id: firstThreadId, name: 'Thread 1' })
+          .wrap(async () => {
+            return client
+              .step({ name: 'Step 1', type: 'assistant_message' })
+              .wrap(async () => {
+                firstStep = client.getCurrentStep();
+
+                return openai.chat.completions.create({
+                  model: 'gpt-3.5-turbo',
+                  messages: [
+                    { role: 'system', content: 'You are a helpful assistant.' },
+                    { role: 'user', content: 'What is the capital of Canada?' }
+                  ]
+                });
+              });
+          }),
+        client
+          .thread({ id: secondThreadId, name: 'Thread 2' })
+          .wrap(async () => {
+            return client
+              .step({ name: 'Step 2', type: 'assistant_message' })
+              .wrap(async () => {
+                secondStep = client.getCurrentStep();
+
+                return openai.chat.completions.create({
+                  model: 'gpt-3.5-turbo',
+                  messages: [
+                    { role: 'system', content: 'You are a helpful assistant.' },
+                    { role: 'user', content: 'What is the capital of Canada?' }
+                  ]
+                });
+              });
+          })
+      ]);
+
+      const {
+        data: [firstGeneration]
+      } = await client.api.getSteps({
+        first: 1,
+        filters: [
+          {
+            field: 'threadId',
+            operator: 'eq',
+            value: firstThreadId!
+          },
+          {
+            field: 'tags',
+            operator: 'in',
+            value: [testId]
+          }
+        ]
+      });
+
+      const {
+        data: [secondGeneration]
+      } = await client.api.getSteps({
+        first: 1,
+        filters: [
+          {
+            field: 'threadId',
+            operator: 'eq',
+            value: secondThreadId!
+          },
+          {
+            field: 'tags',
+            operator: 'in',
+            value: [testId]
+          }
+        ]
+      });
+
+      expect(firstStep?.threadId).toEqual(firstThreadId);
+      expect(secondStep?.threadId).toEqual(secondThreadId);
+
+      expect(firstGeneration?.threadId).toEqual(firstThreadId);
+      expect(firstGeneration?.parentId).toEqual(firstStep?.id);
+      expect(secondGeneration?.threadId).toEqual(secondThreadId);
+      expect(secondGeneration?.parentId).toEqual(secondStep?.id);
+    }, 30000);
   });
 });

From 60c5e1069036e81ff6fe6a9443bbb9b5744d38f4 Mon Sep 17 00:00:00 2001
From: Damien BUTY
Date: Mon, 15 Jul 2024 12:51:01 +0200
Subject: [PATCH 2/3] fix: mock openai calls

---
 src/api.ts                       |   2 +
 src/instrumentation/openai.ts    |  14 ++-
 tests/integration/openai.test.ts | 186 +++++++++++++++++++++----------
 3 files changed, 140 insertions(+), 62 deletions(-)

diff --git a/src/api.ts b/src/api.ts
index 44e9761..dd4426c 100644
--- a/src/api.ts
+++ b/src/api.ts
@@ -399,6 +399,7 @@ export class API {
 
       return response.data;
     } catch (e) {
+      console.error(e);
       if (e instanceof AxiosError) {
         throw new Error(JSON.stringify(e.response?.data.errors));
       } else {
@@ -426,6 +427,7 @@ export class API {
 
       return response.data;
     } catch (e) {
+      console.error(e);
       if (e instanceof AxiosError) {
         throw new Error(JSON.stringify(e.response?.data));
       } else {
diff --git a/src/instrumentation/openai.ts b/src/instrumentation/openai.ts
index b664527..f489c95 100644
--- a/src/instrumentation/openai.ts
+++ b/src/instrumentation/openai.ts
@@ -77,7 +77,7 @@ function instrumentOpenAI(
     options
   ) as any;
 
-  // Patching the completions.create function
+  // Patching the images.generate function
   const originalImagesGenerate = OpenAI.Images.prototype.generate;
   OpenAI.Images.prototype.generate = wrapFunction(
     originalImagesGenerate,
@@ -288,6 +288,16 @@ export interface ProcessOpenAIOutput extends InstrumentOpenAIOptions {
   start: number;
   inputs: Record<string, any>;
 }
 
+function isStream(obj: any): boolean {
+  return (
+    obj !== null &&
+    typeof obj === 'object' &&
+    typeof obj.pipe === 'function' &&
+    typeof obj.on === 'function' &&
+    typeof obj.read === 'function'
+  );
+}
+
 const processOpenAIOutput = async (
   client: LiteralClient,
   output: OpenAIOutput,
@@ -333,7 +343,7 @@ const processOpenAIOutput = async (
     const step = parent
       ? parent.step(stepData)
       : client.step({ ...stepData, type: 'run' });
     await step.send();
-  } else if (output instanceof Stream) {
+  } else if (output instanceof Stream || isStream(output)) {
     const stream = output as Stream<ChatCompletionChunk | Completion>;
 
     if (!stream) {
diff --git a/tests/integration/openai.test.ts b/tests/integration/openai.test.ts
index 25a0b89..cfc4b7f 100644
--- a/tests/integration/openai.test.ts
+++ b/tests/integration/openai.test.ts
@@ -1,5 +1,6 @@
 import 'dotenv/config';
 import OpenAI from 'openai';
+import { PassThrough } from 'stream';
 import { v4 as uuidv4 } from 'uuid';
 
 import {
@@ -21,94 +22,163 @@ const openai = new OpenAI();
 
 describe('OpenAI Instrumentation', () => {
-  beforeAll(function () {});
-
-  describe('Outside of a thread or step wrapper', () => {
-    describe('Simple chat generation', () => {
-      let step: Maybe<Step>;
-      let generationFromStep: OmitUtils<ChatGeneration>;
-      let response: OpenAI.ChatCompletion;
+  // Mock OpenAI Calls
+  beforeAll(() => {
+    /* @ts-expect-error the mock is incomplete but that's OK */
+    OpenAI.Chat.Completions.prototype.create = jest.fn(
+      ({ stream }: { stream: boolean }) => {
+        if (stream) {
+          const generationId = uuidv4();
+          const stream = new PassThrough({ objectMode: true });
+
+          stream.write({
+            id: generationId,
+            object: 'chat.completion.chunk',
+            choices: [
+              {
+                delta: { role: 'assistant', content: 'Ottawa' },
+                index: 0,
+                finish_reason: null
+              }
+            ]
+          });
 
-      beforeAll(async () => {
-        const testId = uuidv4();
+          stream.write({
+            id: generationId,
+            object: 'chat.completion.chunk',
+            choices: [
+              {
+                delta: { role: 'assistant', content: ' is' },
+                index: 0,
+                finish_reason: null
+              }
+            ]
+          });
 
-        const client = new LiteralClient(apiKey, url);
-        client.instrumentation.openai({ tags: [testId] });
+          stream.end({
+            id: generationId,
+            object: 'chat.completion.chunk',
+            choices: [
+              {
+                delta: { role: 'assistant', content: ' the capital of Canada' },
+                index: 0,
+                finish_reason: 'stop'
+              }
+            ]
+          });
 
-        response = await openai.chat.completions.create({
-          model: 'gpt-3.5-turbo',
-          messages: [
-            { role: 'system', content: 'You are a helpful assistant.' },
-            { role: 'user', content: 'What is the capital of Canada?' }
-          ]
-        });
+          return stream;
+        }
 
-        const {
-          data: [generation]
-        } = await client.api.getGenerations({
-          filters: [
+        return Promise.resolve({
+          id: uuidv4(),
+          object: 'chat.completion',
+          choices: [
             {
-              field: 'tags',
-              operator: 'in',
-              value: [testId]
+              message: {
+                role: 'assistant',
+                content: 'Ottawa is the capital of Canada'
+              }
             }
           ]
         });
+      }
+    );
 
-        step = await client.api.getStep(generation.id);
-        generationFromStep = step!.generation!;
+    /* @ts-expect-error the mock is incomplete but that's OK */
+    OpenAI.Images.prototype.generate = jest.fn(() => {
+      return Promise.resolve({
+        data: [{ url: 'https://example.com/image.png' }]
       });
+    });
+  });
 
-      it('should create a generation with no thread or parent', async () => {
-        expect(step?.threadId).toBeNull();
-        expect(step?.parentId).toBeNull();
-        expect(step?.type).toBe('llm');
+  describe('Streamed chat generation', () => {
+    let step: Maybe<Step>;
+    let generationFromStep: OmitUtils<ChatGeneration>;
+
+    beforeAll(async () => {
+      const testId = uuidv4();
+
+      const client = new LiteralClient(apiKey, url);
+      client.instrumentation.openai({ tags: [testId] });
+
+      await openai.chat.completions.create({
+        model: 'gpt-3.5-turbo',
+        messages: [
+          { role: 'system', content: 'You are a helpful assistant.' },
+          { role: 'user', content: 'What is the capital of Canada?' }
+        ],
+        stream: true
+      });
 
+      const {
+        data: [generation]
+      } = await client.api.getGenerations({
+        filters: [
+          {
+            field: 'tags',
+            operator: 'in',
+            value: [testId]
+          }
+        ]
+      });
 
+      step = await client.api.getStep(generation.id);
+      generationFromStep = step!.generation!;
+    });
+
+    it('should create a generation with no thread or parent', async () => {
+      expect(step?.threadId).toBeNull();
+      expect(step?.parentId).toBeNull();
+      expect(step?.type).toBe('llm');
+    });
+
+    it("should log a generation's input & output", async () => {
+      expect(generationFromStep.messages).toEqual([
+        {
+          role: 'system',
+          content: 'You are a helpful assistant.'
+        },
+        {
+          role: 'user',
+          content: 'What is the capital of Canada?'
+        }
+      ]);
+      expect(generationFromStep.messageCompletion).toEqual({
+        role: 'assistant',
+        content: 'Ottawa is the capital of Canada'
+      });
+    });
 
+    it("should log a generation's settings", async () => {
+      expect(generationFromStep.provider).toBe('openai');
+      expect(generationFromStep.model).toContain('gpt-3.5-turbo');
+      expect(generationFromStep.tokenCount).toEqual(expect.any(Number));
+      expect(generationFromStep.inputTokenCount).toEqual(expect.any(Number));
+      expect(generationFromStep.outputTokenCount).toEqual(expect.any(Number));
+    });
+  });
+
+  describe('Outside of a thread or step wrapper', () => {
+    describe('Simple chat generation', () => {
       let step: Maybe<Step>;
       let generationFromStep: OmitUtils<ChatGeneration>;
       let response: OpenAI.ChatCompletion;
 
       beforeAll(async () => {
         const testId = uuidv4();
 
         const client = new LiteralClient(apiKey, url);
+
         client.instrumentation.openai({ tags: [testId] });
 
-        const response = await openai.chat.completions.create({
+        response = await openai.chat.completions.create({
           model: 'gpt-3.5-turbo',
           messages: [
             { role: 'system', content: 'You are a helpful assistant.' },
             { role: 'user', content: 'What is the capital of Canada?' }
-          ],
-          stream: true
+          ]
         });
 
         const {
@@ -123,10 +193,6 @@ describe('OpenAI Instrumentation', () => {
           ]
         });
 
-        for await (const chunk of response) {
-          resultText += chunk.choices[0].delta.content ?? '';
-        }
-
       step = await client.api.getStep(generation.id);
       generationFromStep = step!.generation!;
     });
@@ -150,7 +216,7 @@ describe('OpenAI Instrumentation', () => {
       ]);
       expect(generationFromStep.messageCompletion).toEqual({
         role: 'assistant',
-        content: resultText
+        content: response.choices[0].message.content
       });
     });
 

From 3b156abd79de0f506bd182a675fdf9001253625b Mon Sep 17 00:00:00 2001
From: Damien BUTY
Date: Mon, 15 Jul 2024 12:53:55 +0200
Subject: [PATCH 3/3] fix: mock api key

---
 tests/integration/openai.test.ts | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/integration/openai.test.ts b/tests/integration/openai.test.ts
index cfc4b7f..652e48e 100644
--- a/tests/integration/openai.test.ts
+++ b/tests/integration/openai.test.ts
@@ -18,7 +18,7 @@ if (!url || !apiKey) {
   throw new Error('Missing environment variables');
 }
 
-const openai = new OpenAI();
+const openai = new OpenAI({ apiKey: 'an-ocean-of-noise' });
 
 describe('OpenAI Instrumentation', () => {
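
---

A minimal usage sketch of the context-aware API this series introduces, pieced together from the tests above. The `LiteralClient` constructor arguments, `instrumentation.openai()`, and `thread().wrap()` all appear in the patches; the `@literalai/client` import path and the tag value are illustrative assumptions:

    import OpenAI from 'openai';
    import { LiteralClient } from '@literalai/client'; // assumed package entry point

    const literalClient = new LiteralClient(
      process.env.LITERAL_API_KEY!,
      process.env.LITERAL_API_URL!
    );
    const openai = new OpenAI();

    // Patch the OpenAI client prototypes once; every subsequent call is
    // logged automatically instead of being passed to the instrumentation
    // by hand as with the old `client.instrumentation.openai(response)` API.
    literalClient.instrumentation.openai({ tags: ['example-tag'] });

    await literalClient.thread({ name: 'Example thread' }).wrap(async () => {
      // Inside the wrapper, the generation is attached to the current
      // thread resolved from the async context; no parent argument needed.
      await openai.chat.completions.create({
        model: 'gpt-3.5-turbo',
        messages: [{ role: 'user', content: 'What is the capital of Canada?' }]
      });
    });

Because the parent is now looked up via `getCurrentStep()`/`getCurrentThread()` rather than passed explicitly, a single patched `openai` instance can be shared across concurrent threads without cross-talk, which is what the "doesn't mix up threads and steps" test exercises.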