From d9e52573c4697e24f7c9114c4ede6102ed68fbc2 Mon Sep 17 00:00:00 2001 From: hahuyhoang411 Date: Tue, 28 Nov 2023 10:56:19 +0700 Subject: [PATCH 1/2] fix wrong value api ref --- docs/openapi/NitroAPI.yaml | 8 -------- 1 file changed, 8 deletions(-) diff --git a/docs/openapi/NitroAPI.yaml b/docs/openapi/NitroAPI.yaml index 51a932423..847b9f0be 100644 --- a/docs/openapi/NitroAPI.yaml +++ b/docs/openapi/NitroAPI.yaml @@ -441,10 +441,6 @@ components: default: true nullable: true description: Determines if output generation is in a streaming manner. - cache_prompt: - type: boolean - default: true - description: Optimize performance in repeated or similar requests. temp: type: number default: 0.7 @@ -585,10 +581,6 @@ components: min: 0 max: 1 description: Set probability threshold for more relevant outputs - cache_prompt: - type: boolean - default: true - description: Optimize performance in repeated or similar requests. ChatCompletionResponse: type: object description: Description of the response structure From a20dd7d02976cd891e9c01c50f5a845f14ca3c91 Mon Sep 17 00:00:00 2001 From: hahuyhoang411 Date: Tue, 28 Nov 2023 10:58:29 +0700 Subject: [PATCH 2/2] fix order of cpu_threads in the table of params --- docs/docs/features/load-unload.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docs/docs/features/load-unload.md b/docs/docs/features/load-unload.md index 167e554b1..ca3980069 100644 --- a/docs/docs/features/load-unload.md +++ b/docs/docs/features/load-unload.md @@ -70,8 +70,8 @@ In case you got error while loading models. Please check for the correct model p | `ctx_len` | Integer | The context length for the model operations. | | `embedding` | Boolean | Whether to use embedding in the model. | | `n_parallel` | Integer | The number of parallel operations.| -|`cpu_threads`|Integer|The number of threads for CPU inference.| | `cont_batching` | Boolean | Whether to use continuous batching. | +|`cpu_threads`|Integer|The number of threads for CPU inference.| | `user_prompt` | String | The prompt to use for the user. | | `ai_prompt` | String | The prompt to use for the AI assistant. | | `system_prompt` | String | The prompt for system rules. |