diff --git a/common/arg.cpp b/common/arg.cpp index 4115b2f7511d3..bb005689c1095 100644 --- a/common/arg.cpp +++ b/common/arg.cpp @@ -852,7 +852,7 @@ common_params_context common_params_parser_init(common_params & params, llama_ex params.input_prefix = value; params.enable_chat_template = false; } - ).set_examples({LLAMA_EXAMPLE_MAIN, LLAMA_EXAMPLE_INFILL})); + ).set_examples({LLAMA_EXAMPLE_MAIN, LLAMA_EXAMPLE_SERVER, LLAMA_EXAMPLE_INFILL})); add_opt(common_arg( {"--in-suffix"}, "STRING", "string to suffix after user inputs with (default: empty)", @@ -860,7 +860,7 @@ common_params_context common_params_parser_init(common_params & params, llama_ex params.input_suffix = value; params.enable_chat_template = false; } - ).set_examples({LLAMA_EXAMPLE_MAIN, LLAMA_EXAMPLE_INFILL})); + ).set_examples({LLAMA_EXAMPLE_MAIN, LLAMA_EXAMPLE_SERVER, LLAMA_EXAMPLE_INFILL})); add_opt(common_arg( {"--no-warmup"}, "skip warming up the model with an empty run", diff --git a/examples/server/public/index.html b/examples/server/public/index.html index 6216c08410a28..27570a1eeea67 100644 --- a/examples/server/public/index.html +++ b/examples/server/public/index.html @@ -214,6 +214,10 @@

Settings

+ + + +