langwatch · drewdrewthis · Jun 4, 2026 · Jun 4, 2026
diff --git a/javascript/examples/vitest/tests/helpers/openai-voice-agent.test.ts b/javascript/examples/vitest/tests/helpers/openai-voice-agent.test.ts
@@ -18,9 +18,12 @@ import { encodeAudioToBase64 } from "./audio-encoding";
 import { getFixturePath } from "./fixture-utils";
 import { OpenAiVoiceAgent } from "./openai-voice-agent";
 
-// Skipped in CI: depends on the OpenAI `gpt-4o-audio-preview` model, which
-// returns 404 model_not_found as of 2026-05-19. Tracked separately — the
-// voice work PR will unskip these tests once model access is restored.
+// Skipped in CI: live end-to-end test — calls OpenAI's `gpt-audio-mini` audio
+// model and the real LangWatch backend (cost, API keys, non-deterministic
+// audio), so it runs live/locally rather than in CI. The skip historically
+// also guarded the now-deleted `gpt-4o-audio-preview` (404 model_not_found
+// since 2026-05-19); #607 swapped that dead model for `gpt-audio-mini`, so the
+// model is no longer the blocker — the skip is CI-cost/live-only now.
 const skipInCi = process.env.CI === "true";
 
 /**

diff --git a/javascript/examples/vitest/tests/helpers/openai-voice-agent.ts b/javascript/examples/vitest/tests/helpers/openai-voice-agent.ts
@@ -6,7 +6,7 @@
  * - Generate audio output (voice responses)
  * - Handle multi-turn voice conversations
  *
- * Uses OpenAI's gpt-4o-audio-preview model which supports voice-to-voice interaction.
+ * Uses OpenAI's gpt-audio-mini model which supports voice-to-voice interaction.
  *
  * Example usage:
  * ```typescript
@@ -128,7 +128,7 @@ ${this.constructor.name} TEXT FALLBACK
   /**
    * Calls OpenAI's audio-enabled model to generate voice response
    *
-   * Uses gpt-4o-audio-preview with:
+   * Uses gpt-audio-mini with:
    * - Text and audio modalities
    * - WAV format output
    * - Configured voice (alloy, nova, echo, etc.)
@@ -138,7 +138,7 @@ ${this.constructor.name} TEXT FALLBACK
     messages: ChatCompletionMessageParam[]
   ): Promise<ChatCompletion> {
     return this.openai.chat.completions.create({
-      model: "gpt-4o-audio-preview",
+      model: "gpt-audio-mini",
       modalities: ["text", "audio"],
       audio: { voice: this.config.voice, format: "wav" },
       messages: this.systemMessage

diff --git a/javascript/examples/vitest/tests/multimodal-audio-to-audio.test.ts b/javascript/examples/vitest/tests/multimodal-audio-to-audio.test.ts
@@ -9,9 +9,12 @@ import {
 } from "./helpers";
 import { OpenAiVoiceAgent } from "./helpers/openai-voice-agent";
 
-// Skipped in CI: depends on the OpenAI `gpt-4o-audio-preview` model, which
-// returns 404 model_not_found as of 2026-05-19. Tracked separately — the
-// voice work PR will unskip these tests once model access is restored.
+// Skipped in CI: live end-to-end test — calls OpenAI's `gpt-audio-mini` audio
+// model and the real LangWatch backend (cost, API keys, non-deterministic
+// audio), so it runs live/locally rather than in CI. The skip historically
+// also guarded the now-deleted `gpt-4o-audio-preview` (404 model_not_found
+// since 2026-05-19); #607 swapped that dead model for `gpt-audio-mini`, so the
+// model is no longer the blocker — the skip is CI-cost/live-only now.
 const skipInCi = process.env.CI === "true";
 
 class AudioAgent extends OpenAiVoiceAgent {

diff --git a/javascript/examples/vitest/tests/multimodal-audio-to-text.test.ts b/javascript/examples/vitest/tests/multimodal-audio-to-text.test.ts
@@ -15,9 +15,12 @@ import {
 } from "./helpers";
 import { convertModelMessagesToOpenAIMessages } from "./helpers/convert-core-messages-to-openai";
 
-// CI-skipped: this test still pins `gpt-4o-audio-preview` (deleted, 404 since 2026-05-19) on line 48.
-// The model swap → gpt-audio-mini and the skip-marker removal are tracked in PR #607 (not yet merged).
-// This commit (#606) relaxes the judge criteria below so they're robust once that model swap lands.
+// Skipped in CI: live end-to-end test — calls OpenAI's `gpt-audio-mini` audio
+// model and the real LangWatch backend (cost, API keys, non-deterministic
+// audio), so it runs live/locally rather than in CI. The skip historically
+// also guarded the now-deleted `gpt-4o-audio-preview` (404 model_not_found
+// since 2026-05-19); #607 swapped that dead model for `gpt-audio-mini`, so the
+// model is no longer the blocker — the skip is CI-cost/live-only now.
 const skipInCi = process.env.CI === "true";
 
 class AudioAgent extends AgentAdapter {
@@ -45,7 +48,7 @@ class AudioAgent extends AgentAdapter {
 
   private async respond(messages: ChatCompletionMessageParam[]) {
     return await this.openai.chat.completions.create({
-      model: "gpt-4o-audio-preview",
+      model: "gpt-audio-mini",
       modalities: ["text", "audio"],
       audio: { voice: "alloy", format: "wav" },
       // We need to strip the id, or the openai client will throw an error

diff --git a/javascript/examples/vitest/tests/multimodal-voice-to-voice-conversation.test.ts b/javascript/examples/vitest/tests/multimodal-voice-to-voice-conversation.test.ts
@@ -27,9 +27,12 @@ import {
 } from "./helpers";
 import { messageRoleReversal } from "../../../src/agents/utils";
 
-// Skipped in CI: depends on the OpenAI `gpt-4o-audio-preview` model, which
-// returns 404 model_not_found as of 2026-05-19. Tracked separately — the
-// voice work PR will unskip these tests once model access is restored.
+// Skipped in CI: live end-to-end test — calls OpenAI's `gpt-audio-mini` audio
+// model and the real LangWatch backend (cost, API keys, non-deterministic
+// audio), so it runs live/locally rather than in CI. The skip historically
+// also guarded the now-deleted `gpt-4o-audio-preview` (404 model_not_found
+// since 2026-05-19); #607 swapped that dead model for `gpt-audio-mini`, so the
+// model is no longer the blocker — the skip is CI-cost/live-only now.
 const skipInCi = process.env.CI === "true";
 
 /**