diff --git a/application/api/answer/routes.py b/application/api/answer/routes.py index 3f48d33e4..b694c4aaf 100644 --- a/application/api/answer/routes.py +++ b/application/api/answer/routes.py @@ -118,6 +118,8 @@ def complete_stream(question, docsearch, chat_history, api_key, conversation_id) docs = docsearch.search(question, k=2) + if settings.LLM_NAME == "llama.cpp": + docs = [docs[0]] # join all page_content together with a newline docs_together = "\n".join([doc.page_content for doc in docs]) p_chat_combine = chat_combine_template.replace("{summaries}", docs_together) diff --git a/application/api/user/routes.py b/application/api/user/routes.py index 2b1d505a5..56b020197 100644 --- a/application/api/user/routes.py +++ b/application/api/user/routes.py @@ -6,7 +6,6 @@ from bson.objectid import ObjectId from werkzeug.utils import secure_filename import http.client -from celery.result import AsyncResult from application.api.user.tasks import ingest @@ -142,7 +141,8 @@ def upload_file(): def task_status(): """Get celery job status.""" task_id = request.args.get("task_id") - task = AsyncResult(task_id) + from application.celery import celery + task = celery.AsyncResult(task_id) task_meta = task.info return {"status": task.status, "result": task_meta} diff --git a/application/celery.py b/application/celery.py index 3b4819e73..c19c2e754 100644 --- a/application/celery.py +++ b/application/celery.py @@ -2,7 +2,7 @@ from application.core.settings import settings def make_celery(app_name=__name__): - celery = Celery(app_name, broker=settings.CELERY_BROKER_URL) + celery = Celery(app_name, broker=settings.CELERY_BROKER_URL, backend=settings.CELERY_RESULT_BACKEND) celery.conf.update(settings) return celery diff --git a/application/core/settings.py b/application/core/settings.py index 57a9f1c13..a05fd00b5 100644 --- a/application/core/settings.py +++ b/application/core/settings.py @@ -2,7 +2,7 @@ import os from pydantic import BaseSettings -current_dir = os.path.dirname(os.path.dirname(os.path.abspath(__file__))) +current_dir = os.path.dirname(os.path.dirname(os.path.dirname(os.path.abspath(__file__)))) class Settings(BaseSettings): diff --git a/application/llm/llama_cpp.py b/application/llm/llama_cpp.py index ebd713c54..f18d4379e 100644 --- a/application/llm/llama_cpp.py +++ b/application/llm/llama_cpp.py @@ -1,15 +1,16 @@ from application.llm.base import BaseLLM +from application.core.settings import settings class LlamaCpp(BaseLLM): - def __init__(self, api_key, llm_name='/Users/pavel/Desktop/docsgpt/application/models/orca-test.bin'): + def __init__(self, api_key, llm_name=settings.MODEL_PATH, **kwargs): global llama try: from llama_cpp import Llama except ImportError: raise ImportError("Please install llama_cpp using pip install llama-cpp-python") - llama = Llama(model_path=llm_name) + llama = Llama(model_path=llm_name, n_ctx=2048) def gen(self, model, engine, messages, stream=False, **kwargs): context = messages[0]['content'] diff --git a/docker-compose-local.yaml b/docker-compose-local.yaml index b24ed4886..3aebe8b50 100644 --- a/docker-compose-local.yaml +++ b/docker-compose-local.yaml @@ -6,42 +6,10 @@ services: environment: - VITE_API_HOST=http://localhost:7091 - VITE_API_STREAMING=$VITE_API_STREAMING + - VITE_EMBEDDINGS_NAME=$EMBEDDINGS_NAME ports: - "5173:5173" - # backend: - # build: ./application - # environment: - # - LLM_NAME=$LLM_NAME - # - EMBEDDINGS_NAME=$EMBEDDINGS_NAME - # - CELERY_BROKER_URL=redis://redis:6379/0 - # - CELERY_RESULT_BACKEND=redis://redis:6379/1 - # - MONGO_URI=mongodb://mongo:27017/docsgpt - # ports: - # - "7091:7091" - # volumes: - # - ./application/indexes:/app/application/indexes - # - ./application/inputs:/app/application/inputs - # - ./application/vectors:/app/application/vectors - # - ./application/models:/app/application/models - # depends_on: - # - redis - # - mongo - - worker: - build: ./application - command: celery -A application.app.celery worker -l INFO - environment: - - LLM_NAME=$LLM_NAME - - EMBEDDINGS_NAME=$EMBEDDINGS_NAME - - CELERY_BROKER_URL=redis://redis:6379/0 - - CELERY_RESULT_BACKEND=redis://redis:6379/1 - - MONGO_URI=mongodb://mongo:27017/docsgpt - - API_URL=http://backend:7091 - depends_on: - - redis - - mongo - redis: image: redis:6-alpine ports: diff --git a/frontend/src/Navigation.tsx b/frontend/src/Navigation.tsx index c5488a508..9f84b97f0 100644 --- a/frontend/src/Navigation.tsx +++ b/frontend/src/Navigation.tsx @@ -59,6 +59,7 @@ export default function Navigation({ const navRef = useRef(null); const apiHost = import.meta.env.VITE_API_HOST || 'https://docsapi.arc53.com'; + const embeddingsName = import.meta.env.VITE_EMBEDDINGS_NAME || 'openai_text-embedding-ada-002'; useEffect(() => { if (!conversations) { @@ -253,7 +254,7 @@ export default function Navigation({
{docs ? ( docs.map((doc, index) => { - if (doc.model === 'openai_text-embedding-ada-002') { + if (doc.model === embeddingsName) { return (