Skip to content
Closed
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
9 changes: 0 additions & 9 deletions charts/azimuth-chat/ci/ui-only-values.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -5,12 +5,3 @@ azimuth-llm:
service:
zenith:
enabled: false
appSettings:
# Verify that we can set non-standard LLM params
llm_params:
max_tokens: 101
temperature: 0.1
top_p: 0.15
top_k: 1
presence_penalty: 0.9
frequency_penalty: 1
16 changes: 16 additions & 0 deletions charts/azimuth-chat/ci/ui-param-overrides.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,16 @@
azimuth-llm:
api:
enabled: false
ui:
service:
zenith:
enabled: false
appSettings:
# Verify that we can set non-standard LLM params
llm_params:
max_tokens: 101
temperature: 0.1
top_p: 0.15
top_k: 1
presence_penalty: 0.9
frequency_penalty: 1
1 change: 0 additions & 1 deletion web-apps/chat/app.py
Original file line number Diff line number Diff line change
Expand Up @@ -61,7 +61,6 @@ class PossibleSystemPromptException(Exception):
streaming=True,
)


def inference(latest_message, history):
# Allow mutating global variable
global BACKEND_INITIALISED
Expand Down
10 changes: 5 additions & 5 deletions web-apps/chat/defaults.yml
Original file line number Diff line number Diff line change
Expand Up @@ -14,12 +14,12 @@ page_title: Large Language Model
# See https://platform.openai.com/docs/api-reference/chat/create
# and https://docs.vllm.ai/en/v0.6.0/serving/openai_compatible_server.html#extra-parameters
llm_params:
-  max_tokens:
+  max_tokens: 1000
   temperature: 0
-  top_p:
-  top_k:
-  frequency_penalty:
-  presence_penalty:
+  top_p: 1
+  top_k: -1
+  frequency_penalty: 0
+  presence_penalty: 0

# Gradio theme constructor parameters (e.g. 'primary_hue')
# See https://www.gradio.app/guides/theming-guide
Expand Down
2 changes: 1 addition & 1 deletion web-apps/utils/utils.py
Original file line number Diff line number Diff line change
Expand Up @@ -95,7 +95,7 @@ def load_settings() -> dict:
"Please check for typos"
)
settings = {**defaults, **overrides}
-    if "backend_url" not in settings or not settings["backend_url"]:
+    if "backend_url" not in settings or settings["backend_url"] == defaults["backend_url"]:
# Try to detect in-cluster address
in_cluster_backend = api_address_in_cluster()
if not in_cluster_backend:
Expand Down
Loading