Commit 15085c5
1 parent: 4be68ef
Showing 5 changed files with 717 additions and 24 deletions.
@@ -0,0 +1 @@
export * from './predictor.class';
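This first changed file is a one-line barrel export: it re-exports everything from predictor.class so consumers can import the Predictor from the containing directory instead of the implementation file. A minimal consumer sketch, assuming the barrel is the directory's index file (the exact relative path is hypothetical):

// hypothetical consumer, importing via the barrel rather than predictor.class directly
import { Predictor } from '../classification';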
@@ -0,0 +1,361 @@
import { Utils } from '@voiceflow/common';
import { DEFAULT_INTENT_CLASSIFICATION_PROMPT_WRAPPER_CODE } from '@voiceflow/default-prompt-wrappers';
import { IntentClassificationSettings } from '@voiceflow/dtos';
import { ISlotFullfilment } from '@voiceflow/natural-language-commander';
import { VoiceflowConstants } from '@voiceflow/voiceflow-types';
import type { AxiosStatic } from 'axios';
import { match } from 'ts-pattern';

import MLGateway from '@/lib/clients/ml-gateway';
import logger from '@/logger';

import { handleNLCCommand } from '../nlu/nlc';
import { mapChannelIntent } from '../nlu/utils';
import { isIntentClassificationLLMSettings, isIntentClassificationNLUSettings } from './classification.utils';
import {
  ClassificationResult,
  NLUIntentPrediction,
  NLUPredictOptions,
  PredictedSlot,
  Prediction,
  PredictOptions,
  PredictRequest,
} from './interfaces/nlu.interface';
import { executePromptWrapper } from './prompt-wrapper-executor';

const ML_GATEWAY_TIMEOUT = 5000;

const nonePrediction: Omit<Prediction, 'utterance'> = {
  predictedIntent: VoiceflowConstants.IntentName.NONE,
  predictedSlots: [],
  confidence: 100,
};

// keep only the slots that were actually filled with a value
const hasValueReducer = (slots?: ISlotFullfilment[]) =>
  (slots ?? []).reduce<{ name: string; value: string }[]>(
    (acc, { name, value }) => (value ? [...acc, { name, value }] : acc),
    []
  );

export interface PredictorConfig {
  axios: AxiosStatic;
  mlGateway: MLGateway;
  CLOUD_ENV: string;
  NLU_GATEWAY_SERVICE_HOST: string | null;
  NLU_GATEWAY_SERVICE_PORT_APP: string | null;
}

export class Predictor {
  private intentNameMap: Record<string, PredictRequest['intents'][number]> = {};

  readonly predictions: Partial<ClassificationResult> = {};

  constructor(
    private config: PredictorConfig,
    private props: PredictRequest,
    private settings: IntentClassificationSettings,
    private options: PredictOptions
  ) {
    // index intents by name so NLU/LLM predictions can be matched back to the NLU model
    this.intentNameMap = Object.fromEntries(props.intents.map((intent) => [intent.name, intent]));
  }

  private get nluGatewayURL() {
    const protocol = this.config.CLOUD_ENV === 'e2e' ? 'https' : 'http';
    return `${protocol}://${this.config.NLU_GATEWAY_SERVICE_HOST}:${this.config.NLU_GATEWAY_SERVICE_PORT_APP}`;
  }

  // return all the same prediction shape?
  public async nlc(utterance: string, openSlot = false): Promise<Prediction | null> {
    if (!this.props.intents.length) {
      this.predictions.nlc = {
        openSlot,
        error: {
          message: 'No intents to match against',
        },
      };
      return null;
    }

    const data = handleNLCCommand({
      query: utterance,
      model: {
        intents: this.props.intents,
        slots: this.props.slots ?? [],
      },
      locale: this.options.locale,
      openSlot,
    });

    if (!data) {
      this.predictions.nlc = {
        openSlot,
        error: {
          message: 'No matches found',
        },
      };
      return null;
    }

    const response = {
      predictedIntent: mapChannelIntent(data.intent),
      predictedSlots: hasValueReducer(data.slots),
      confidence: data.confidence,
      utterance,
    };

    this.predictions.nlc = {
      ...this.predictions.nlc,
      ...response,
      openSlot,
    };

    return response;
  }

  public async fillSlots(utterance: string, options?: NLUPredictOptions): Promise<PredictedSlot[] | null> {
    const prediction = await this.nluGatewayPrediction(utterance, options);

    if (!prediction) {
      this.predictions.fillSlots = {
        error: {
          message: 'Something went wrong filling slots',
        },
      };
      return null;
    }

    this.predictions.fillSlots = prediction.predictedSlots;

    return prediction.predictedSlots;
  }

  private async nluGatewayPrediction(utterance: string, options?: NLUPredictOptions) {
    const { data: prediction } = await this.config.axios
      .post<NLUIntentPrediction | null>(`${this.nluGatewayURL}/v1/predict/${this.props.versionID}`, {
        utterance,
        tag: this.props.tag,
        workspaceID: this.props.workspaceID,
        filteredIntents: options?.filteredIntents ?? [],
        filteredEntities: options?.filteredEntities ?? [],
        excludeFilteredIntents: false,
        excludeFilteredEntities: false,
        limit: 10,
      })
      .catch((err: Error) => {
        logger.error(err, 'Something went wrong with NLU prediction');
        return { data: null };
      });

    return prediction;
  }

  public async nlu(utterance: string, options?: NLUPredictOptions): Promise<NLUIntentPrediction | null> {
    const prediction = await this.nluGatewayPrediction(utterance, options);
    if (!prediction) {
      this.predictions.nlu = {
        error: {
          message: 'Something went wrong with NLU prediction',
        },
      };
      return null;
    }

    this.predictions.nlu = prediction;

    // treat predictions below the configured confidence threshold as no match
    if (isIntentClassificationNLUSettings(this.settings) && prediction.confidence < this.settings.params.confidence) {
      this.predictions.nlu = {
        ...prediction,
        error: {
          message: 'NLU predicted confidence below settings threshold',
        },
      };
      return null;
    }

    return prediction;
  }

  public async llm(
    nluPrediction: NLUIntentPrediction,
    { mlGateway }: { mlGateway: MLGateway }
  ): Promise<Omit<Prediction, 'predictedSlots'> | null> {
    if (!isIntentClassificationLLMSettings(this.settings)) {
      return null;
    }

    const promptContent = this.settings.promptWrapper?.content ?? DEFAULT_INTENT_CLASSIFICATION_PROMPT_WRAPPER_CODE;

    const intents = nluPrediction.intents
      // filter out the none intent
      .filter((intent) => intent.name !== VoiceflowConstants.IntentName.NONE)
      .map((intent) => this.intentNameMap[intent.name])
      // TODO: PL-897
      .filter(Utils.array.isNotNullish);

    if (!intents.length) return nluPrediction;

    const promptArgs = {
      intents,
      query: nluPrediction.utterance,
    };

    let prompt;
    try {
      const result = await executePromptWrapper(promptContent, promptArgs);
      prompt = result.prompt;
    } catch (err) {
      logger.error(err, 'PromptWrapperError: failed to execute prompt wrapper');
      this.predictions.llm = {
        error: {
          message: 'PromptWrapperError: failed to execute prompt wrapper',
        },
      };
      return null;
    }

    const completionResponse = await mlGateway.private?.completion
      .generateCompletion({
        workspaceID: this.props.workspaceID,
        prompt,
        params: {
          // TODO: models are different between ml gateway sdk and dtos package
          model: this.settings.params.model,
          temperature: this.settings.params.temperature,
        },
        options: {
          timeout: ML_GATEWAY_TIMEOUT,
        },
      })
      .catch((error: Error) => {
        logger.error(error, '[hybridPredict intent classification]');
        this.predictions.llm = {
          error: {
            message: 'LLM completion failed, falling back to NLU',
          },
        };
        return null;
      });

    if (!completionResponse?.output) {
      this.predictions.llm = {
        error: {
          message: 'Unable to get LLM result, potential timeout',
        },
      };
      return null;
    }

    // validate the LLM output as a valid intent
    const matchedIntent = this.props.intents.find((intent) => intent.name === completionResponse.output);
    const { error } = completionResponse;

    this.predictions.llm = {
      ...completionResponse,
      error: !error ? undefined : { message: error },
    };

    if (!matchedIntent) {
      this.predictions.llm = {
        ...this.predictions.llm,
        error: {
          message: "LLM prediction didn't match any intents, falling back to NLU",
        },
      };
      return null;
    }

    const response = {
      utterance: nluPrediction.utterance,
      predictedIntent: matchedIntent.name,
      predictedSlots: [],
      confidence: 1,
      model: completionResponse.model,
      multiplier: completionResponse.multiplier,
      tokens: completionResponse.tokens,
    };

    this.predictions.llm = response;

    return response;
  }

  public async predict(utterance: string): Promise<Prediction | null> {
    // 1. try restricted regex matching first (no open slots) - exact string match
    const nlcPrediction = await this.nlc(utterance, false);
    if (nlcPrediction) {
      this.predictions.result = 'nlc';
      return nlcPrediction;
    }

    // 2. NLU prediction
    const nluPrediction = await this.nlu(utterance, this.options);

    if (!nluPrediction) {
      // 3. NLU failed - fall back to open regex slot matching
      this.predictions.result = 'nlc';
      const openPrediction = await this.nlc(utterance, true);
      return (
        openPrediction ?? {
          ...nonePrediction,
          utterance,
        }
      );
    }

    if (isIntentClassificationNLUSettings(this.settings)) {
      this.predictions.result = 'nlu';
      return nluPrediction;
    }

    if (isIntentClassificationLLMSettings(this.settings)) {
      // 4. rerank the NLU candidates with the LLM
      const llmPrediction = await this.llm(nluPrediction, {
        mlGateway: this.config.mlGateway,
      });

      if (!llmPrediction) {
        // fall back to the NLU prediction
        this.predictions.result = 'nlu';
        return nluPrediction;
      }

      this.predictions.result = 'llm';

      // 5. retrieve the full intent from the intent map
      const intent = this.intentNameMap[llmPrediction.predictedIntent];

      // 6. slot filling: reuse NLU slots if the LLM agrees with the NLU intent,
      // otherwise re-run slot filling scoped to the LLM's intent
      const slots = await match({
        predicted: llmPrediction.predictedIntent === nluPrediction.predictedIntent,
        hasSlots: !!intent?.slots?.length,
      })
        .with({ predicted: true }, () => nluPrediction.predictedSlots)
        .with({ predicted: false, hasSlots: true }, () =>
          this.fillSlots(utterance, {
            filteredIntents: [llmPrediction.predictedIntent],
          })
        )
        .otherwise(() => []);

      return {
        ...llmPrediction,
        predictedSlots: slots ?? [],
      };
    }

    // finally, try open regex slot matching
    this.predictions.result = 'nlc';
    const openPrediction = await this.nlc(utterance, true);
    return (
      openPrediction ?? {
        ...nonePrediction,
        utterance,
      }
    );
  }

  public hasErrors() {
    return this.predictions.nlc?.error || this.predictions.nlu?.error || this.predictions.llm?.error;
  }

  public get classificationType() {
    return this.settings.type;
  }
}
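For orientation, here is a minimal usage sketch of the Predictor above. It assumes the sketch sits next to predictor.class.ts; the declared gateway client and request/settings objects are hypothetical stand-ins whose real shapes come from the interfaces imported at the top of the file.

import axios from 'axios';

import MLGateway from '@/lib/clients/ml-gateway';
import logger from '@/logger';

import { IntentClassificationSettings } from '@voiceflow/dtos';

import { PredictOptions, PredictRequest } from './interfaces/nlu.interface';
import { Predictor } from './predictor.class';

// Assumed to be provided by the surrounding service; values here are illustrative only.
declare const mlGateway: MLGateway;
declare const props: PredictRequest;
declare const settings: IntentClassificationSettings;
declare const options: PredictOptions;

const predictor = new Predictor(
  {
    axios,
    mlGateway,
    CLOUD_ENV: 'production', // any value other than 'e2e' selects http
    NLU_GATEWAY_SERVICE_HOST: 'nlu-gateway', // hypothetical host
    NLU_GATEWAY_SERVICE_PORT_APP: '8080', // hypothetical port
  },
  props,
  settings,
  options
);

// predict() cascades: restricted NLC -> NLU -> optional LLM rerank -> open-slot NLC fallback
const prediction = await predictor.predict('I want a large pepperoni pizza');

if (predictor.hasErrors()) {
  // predictions records each stage's outcome (nlc/nlu/llm/result) for debugging
  logger.error(predictor.predictions, 'intent classification had stage errors');
}

Note the slot-filling decision in predict(): when the LLM agrees with the NLU intent, the NLU slots are reused as-is; when it disagrees, fillSlots re-queries the NLU gateway scoped to the LLM's intent via filteredIntents, so the returned slots always belong to the winning intent.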