Use APIM with multiple models: accept a comma-delimited list of GPT deployments and select the one requested (#207)

paullizer · web-flow · commit 1100eaec1b4b · 2025-05-22T14:54:23.000-04:00
diff --git a/application/single_app/config.py b/application/single_app/config.py
@@ -86,7 +86,7 @@
 
 app.config['SECRET_KEY'] = os.getenv("SECRET_KEY")
 app.config['SESSION_TYPE'] = 'filesystem'
-app.config['VERSION'] = '0.213.002'
+app.config['VERSION'] = '0.213.003'
 Session(app)
 
 CLIENTS = {}
diff --git a/application/single_app/route_backend_chats.py b/application/single_app/route_backend_chats.py
@@ -63,8 +63,36 @@ def chat_api():
 
         try:
             if enable_gpt_apim:
-                gpt_model = settings.get('azure_apim_gpt_deployment')
-                if not gpt_model: raise ValueError("APIM GPT deployment name not configured.")
+                # read raw comma-delimited deployments
+                raw = settings.get('azure_apim_gpt_deployment', '')
+                if not raw:
+                    raise ValueError("APIM GPT deployment name not configured.")
+
+                # split, strip, and filter out empty entries
+                apim_models = [m.strip() for m in raw.split(',') if m.strip()]
+                if not apim_models:
+                    raise ValueError("No valid APIM GPT deployment names found.")
+
+                # if frontend specified one, use it (must be in the configured list)
+                if frontend_gpt_model:
+                    if frontend_gpt_model not in apim_models:
+                        raise ValueError(
+                            f"Requested model '{frontend_gpt_model}' is not configured for APIM."
+                        )
+                    gpt_model = frontend_gpt_model
+
+                # otherwise if there's exactly one deployment, default to it
+                elif len(apim_models) == 1:
+                    gpt_model = apim_models[0]
+
+                # otherwise you must pass model_deployment in the request
+                else:
+                    raise ValueError(
+                        "Multiple APIM GPT deployments configured; please include "
+                        "'model_deployment' in your request."
+                    )
+
+                # initialize the APIM client
                 gpt_client = AzureOpenAI(
                     api_version=settings.get('azure_apim_gpt_api_version'),
                     azure_endpoint=settings.get('azure_apim_gpt_endpoint'),