fix: test cases

namchuai · namchuai · commit cceeb06d1eb3 · 2024-06-20T16:07:38.000+07:00
Signed-off-by: James <namnh0122@gmail.com>
diff --git a/cortex-js/src/infrastructure/controllers/assistants.controller.spec.ts b/cortex-js/src/infrastructure/controllers/assistants.controller.spec.ts
@@ -2,13 +2,21 @@ import { Test, TestingModule } from '@nestjs/testing';
 import { AssistantsController } from './assistants.controller';
 import { AssistantsUsecases } from '@/usecases/assistants/assistants.usecases';
 import { DatabaseModule } from '@/infrastructure/database/database.module';
+import { ModelRepositoryModule } from '../repositories/models/model.module';
+import { DownloadManagerModule } from '../services/download-manager/download-manager.module';
+import { EventEmitterModule } from '@nestjs/event-emitter';
 
 describe('AssistantsController', () => {
   let controller: AssistantsController;
 
   beforeEach(async () => {
     const module: TestingModule = await Test.createTestingModule({
-      imports: [DatabaseModule],
+      imports: [
+        EventEmitterModule.forRoot(),
+        DatabaseModule,
+        ModelRepositoryModule,
+        DownloadManagerModule,
+      ],
       controllers: [AssistantsController],
       providers: [AssistantsUsecases],
       exports: [AssistantsUsecases],
diff --git a/cortex-js/src/infrastructure/dtos/assistants/model-setting.dto.ts b/cortex-js/src/infrastructure/dtos/assistants/model-setting.dto.ts
@@ -0,0 +1,218 @@
+import { ApiProperty } from '@nestjs/swagger';
+import { IsArray, IsOptional } from 'class-validator';
+
+/**
+ * Model settings DTO. Every field is described for the generated
+ * Swagger/OpenAPI schema through `@ApiProperty`.
+ *
+ * Only `stop` carries class-validator decorators (`@IsArray`, `@IsOptional`);
+ * the other fields have no validation decorators in this class.
+ */
+export class ModelSettingDto {
+  // Schema maximum is 2 so it agrees with the "between 0 and 2" description.
+  // NOTE(review): marked `required: false` yet declared without `?` — confirm.
+  @ApiProperty({
+    type: 'number',
+    minimum: 0,
+    maximum: 2,
+    required: false,
+    default: 1,
+    description: `What sampling temperature to use, between 0 and 2. Higher values like 0.8 will make the output more random, while lower values like 0.2 will make it more focused and deterministic.`,
+  })
+  temperature: number;
+
+  // NOTE(review): marked `required: false` yet declared without `?` — confirm.
+  @ApiProperty({
+    type: 'number',
+    minimum: 0,
+    maximum: 1,
+    required: false,
+    default: 1,
+    description: `An alternative to sampling with temperature, called nucleus sampling, where the model considers the results of the tokens with top_p probability mass. So 0.1 means only the tokens comprising the top 10% probability mass are considered.\nWe generally recommend altering this or temperature but not both.`,
+  })
+  top_p: number;
+
+  @ApiProperty({
+    required: false,
+    example: '',
+    description: 'GGUF metadata: tokenizer.chat_template',
+  })
+  prompt_template?: string;
+
+  @ApiProperty({
+    required: false,
+    example: [],
+    description:
+      'Defines specific tokens or phrases at which the model will stop generating further output.',
+    default: [],
+  })
+  @IsArray()
+  @IsOptional()
+  stop?: string[];
+
+  @ApiProperty({
+    required: false,
+    type: 'number',
+    example: 0,
+    description:
+      'Adjusts the likelihood of the model repeating words or phrases in its output.',
+  })
+  frequency_penalty?: number;
+
+  @ApiProperty({
+    required: false,
+    type: 'number',
+    example: 0,
+    description:
+      'Influences the generation of new and varied concepts in the model’s output.',
+  })
+  presence_penalty?: number;
+
+  @ApiProperty({
+    required: false,
+    type: 'number',
+    example: 4096,
+    default: 4096,
+    description:
+      'The context length for model operations varies; the maximum depends on the specific model used.',
+  })
+  ctx_len?: number;
+
+  @ApiProperty({
+    required: false,
+    type: 'boolean',
+    example: true,
+    default: true,
+    description: 'Enable real-time data processing for faster predictions.',
+  })
+  stream?: boolean;
+
+  @ApiProperty({
+    required: false,
+    type: 'number',
+    example: 2048,
+    default: 2048,
+    description:
+      'The maximum number of tokens the model will generate in a single response.',
+  })
+  max_tokens?: number;
+
+  @ApiProperty({
+    required: false,
+    type: 'number',
+    example: 1,
+    default: 1,
+    description: 'The number of layers to load onto the GPU for acceleration.',
+  })
+  ngl?: number;
+
+  @ApiProperty({
+    required: false,
+    type: 'number',
+    example: 1,
+    default: 1,
+    description: 'Number of parallel sequences to decode',
+  })
+  n_parallel?: number;
+
+  @ApiProperty({
+    required: false,
+    type: 'number',
+    example: 1,
+    default: 1,
+    description:
+      'Determines CPU inference threads, limited by hardware and OS. (Maximum determined by system)',
+  })
+  cpu_threads?: number;
+
+  @ApiProperty({
+    required: false,
+    type: 'string',
+    example: '',
+    default: '',
+    description: 'The prompt to use for internal configuration',
+  })
+  pre_prompt?: string;
+
+  @ApiProperty({
+    required: false,
+    type: 'number',
+    example: 0,
+    default: 0,
+    description: 'The batch size for prompt eval step',
+  })
+  n_batch?: number;
+
+  @ApiProperty({
+    required: false,
+    type: 'boolean',
+    example: true,
+    default: true,
+    description: 'To enable prompt caching or not',
+  })
+  caching_enabled?: boolean;
+
+  @ApiProperty({
+    required: false,
+    type: 'number',
+    example: 0,
+    default: 0,
+    description: 'Group attention factor in self-extend',
+  })
+  grp_attn_n?: number;
+
+  @ApiProperty({
+    required: false,
+    type: 'number',
+    example: 0,
+    default: 0,
+    description: 'Group attention width in self-extend',
+  })
+  grp_attn_w?: number;
+
+  @ApiProperty({
+    required: false,
+    type: 'boolean',
+    example: false,
+    default: false,
+    description: 'Prevent system swapping of the model to disk in macOS',
+  })
+  mlock?: boolean;
+
+  @ApiProperty({
+    required: false,
+    type: 'string',
+    example: '',
+    default: '',
+    description:
+      'You can constrain the sampling using GBNF grammars by providing path to a grammar file',
+  })
+  grammar_file?: string;
+
+  @ApiProperty({
+    required: false,
+    type: 'boolean',
+    example: true,
+    default: true,
+    description: 'To enable Flash Attention, default is true',
+  })
+  flash_attn?: boolean;
+
+  @ApiProperty({
+    required: false,
+    type: 'string',
+    example: '',
+    default: '',
+    description: 'KV cache type: f16, q8_0, q4_0, default is f16',
+  })
+  cache_type?: string;
+
+  @ApiProperty({
+    required: false,
+    type: 'boolean',
+    example: true,
+    default: true,
+    description: 'To enable mmap, default is true',
+  })
+  use_mmap?: boolean;
+}
diff --git a/cortex-js/src/infrastructure/repositories/models/model.repository.ts b/cortex-js/src/infrastructure/repositories/models/model.repository.ts
@@ -12,10 +12,7 @@ import {
   writeFileSync,
 } from 'fs';
 import { load, dump } from 'js-yaml';
-import {
-  isLocalModel,
-  normalizeModelId,
-} from '@/utils/normalize-model-id';
+import { isLocalModel, normalizeModelId } from '@/utils/normalize-model-id';
 
 @Injectable()
 export class ModelRepositoryImpl implements ModelRepository {
diff --git a/cortex-js/src/usecases/assistants/assistants.usecases.spec.ts b/cortex-js/src/usecases/assistants/assistants.usecases.spec.ts
@@ -1,13 +1,21 @@
 import { Test, TestingModule } from '@nestjs/testing';
 import { AssistantsUsecases } from './assistants.usecases';
 import { DatabaseModule } from '@/infrastructure/database/database.module';
+import { ModelRepositoryModule } from '@/infrastructure/repositories/models/model.module';
+import { DownloadManagerModule } from '@/infrastructure/services/download-manager/download-manager.module';
+import { EventEmitterModule } from '@nestjs/event-emitter';
 
 describe('AssistantsService', () => {
   let service: AssistantsUsecases;
 
   beforeEach(async () => {
     const module: TestingModule = await Test.createTestingModule({
-      imports: [DatabaseModule],
+      imports: [
+        EventEmitterModule.forRoot(),
+        DatabaseModule,
+        ModelRepositoryModule,
+        DownloadManagerModule,
+      ],
       exports: [AssistantsUsecases],
       providers: [AssistantsUsecases],
     }).compile();