From e8037de99b5a703c97983cc66496e037992953ab Mon Sep 17 00:00:00 2001 From: Ayush Singhal Date: Fri, 6 Feb 2026 19:19:02 +0530 Subject: [PATCH] update backend url --- .env.example | 2 +- src/app/conversation/schemas/request.py | 3 +-- src/app/llm_model/enums/ModelName.py | 14 -------------- src/app/llm_model/enums/__init__.py | 3 +-- src/services/llm_service/factory.py | 6 +++--- src/setup/config/config.py | 2 +- 6 files changed, 7 insertions(+), 23 deletions(-) delete mode 100644 src/app/llm_model/enums/ModelName.py diff --git a/.env.example b/.env.example index 75522e2..2dd2bb0 100644 --- a/.env.example +++ b/.env.example @@ -16,6 +16,6 @@ GOOGLE_API_KEY=key_here LOG_LEVEL=INFO LOG_FORMAT=standard -BACKEND_URL=http://localhost:8000/internal/v1 +BACKEND_URL=http://localhost:8000/internal SECRET_ENCRYPTION_KEY=secure_key_here diff --git a/src/app/conversation/schemas/request.py b/src/app/conversation/schemas/request.py index c5282df..4ae7bcf 100644 --- a/src/app/conversation/schemas/request.py +++ b/src/app/conversation/schemas/request.py @@ -1,7 +1,6 @@ from pydantic import BaseModel, Field, field_validator from typing import Optional, List, Dict -from src.app.llm_model.enums.ModelName import ModelName from src.app.llm_model.enums.ModelProvider import ModelProvider from src.core.exceptions import ValidationError @@ -9,7 +8,7 @@ class ChatRequest(BaseModel): profile_id: str query: str - model: ModelName + model: str provider: ModelProvider temperature: Optional[float] = Field(default=0.7, ge=0.0, le=2.0) max_tokens: Optional[int] = Field(default=None, gt=0) diff --git a/src/app/llm_model/enums/ModelName.py b/src/app/llm_model/enums/ModelName.py deleted file mode 100644 index 5e94dcb..0000000 --- a/src/app/llm_model/enums/ModelName.py +++ /dev/null @@ -1,14 +0,0 @@ -from src.core.enums.BaseEnum import BaseEnum - - -class ModelName(BaseEnum): - GPT_4_1_MINI = "gpt-4.1-mini" - GPT_4_1_NANO = "gpt-4.1-nano" - DALL_E_3 = "dall-e-3" - CLAUDE_3_7_SONNET = "claude-3.7-sonnet" - CLAUDE_3_5_HAIKU = "claude-3.5-haiku" - GEMINI_2_5_PRO = "gemini-2.5-pro" - GEMINI_2_5_FLASH = "gemini-2.5-flash" - GEMINI_2_5_FLASH_IMAGE_PREVIEW = "gemini-2.5-flash-image-preview" - MISTRAL_7B = "mistral-7b" - LLAMA_2 = "llama-2" diff --git a/src/app/llm_model/enums/__init__.py b/src/app/llm_model/enums/__init__.py index c04d2c2..18be3e0 100644 --- a/src/app/llm_model/enums/__init__.py +++ b/src/app/llm_model/enums/__init__.py @@ -1,6 +1,5 @@ -from src.app.llm_model.enums.ModelName import ModelName from src.app.llm_model.enums.ModelProvider import ModelProvider from src.app.llm_model.enums.QueryType import QueryType from src.app.conversation.enums.FileType import FileType -__all__ = [ModelName, ModelProvider, QueryType, FileType] +__all__ = [ModelProvider, QueryType, FileType] diff --git a/src/services/llm_service/factory.py b/src/services/llm_service/factory.py index 51391ab..5e322f4 100644 --- a/src/services/llm_service/factory.py +++ b/src/services/llm_service/factory.py @@ -1,7 +1,7 @@ from sqlalchemy.ext.asyncio import AsyncSession from src.app.conversation.schemas import ChatRequest -from src.app.llm_model.enums import ModelProvider, ModelName +from src.app.llm_model.enums import ModelProvider from src.app.llm_model.repository import LLMModelRepo from src.core.exceptions import ValidationError from src.core.exceptions.BaseError import BaseError @@ -63,9 +63,9 @@ async def get_llm_provider( raise BaseError(f"Failed to initialize {provider.value} service: {str(e)}") from e @classmethod - async def validate_model(cls, db: AsyncSession, model: ModelName, provider: ModelProvider): + async def validate_model(cls, db: AsyncSession, model: str, provider: ModelProvider): llm_repo = LLMModelRepo(db).repo - llm_model = await llm_repo.get(db=db, code=model.value, provider=provider.label, deleted_at=None) + llm_model = await llm_repo.get(db=db, code=model, provider=provider.label, deleted_at=None) if llm_model is None or llm_model.get('is_active', False) == False: raise BaseError("Model is not in use") return llm_model diff --git a/src/setup/config/config.py b/src/setup/config/config.py index 5435497..32ecb9d 100644 --- a/src/setup/config/config.py +++ b/src/setup/config/config.py @@ -21,7 +21,7 @@ class Config(BaseSettings): anthropic_api_key: str = "" google_api_key: str = "" - backend_url: str = "http://localhost:8000/internal/v1" + backend_url: str = "http://localhost:8000/internal" timeout: int = 60 max_retries: int = 3