quick fix to use openai instead of ollama, in vetor_storage.py

2026-02-05 00:04:10 +03:00
parent f87f3c0cdd
commit 833aad317a
2 changed files with 40 additions and 13 deletions
--- a/services/rag/langchain/QWEN.md
+++ b/services/rag/langchain/QWEN.md
@@ -105,12 +105,19 @@ The project is organized into 8 development phases as outlined in `PLANNING.md`:
 The project uses environment variables for configuration:
 ```env
 # Embedding configuration
 OLLAMA_EMBEDDING_MODEL=MODEL      # Name of the Ollama model for embeddings
 OPENAI_EMBEDDING_MODEL=MODEL      # Name of the OpenAI model for embeddings (default: text-embedding-ada-002)
 OPENAI_EMBEDDING_BASE_URL=URL     # OpenAI-compatible API URL for embeddings
 OPENAI_EMBEDDING_API_KEY=KEY      # API key for OpenAI-compatible embedding service
 EMBEDDING_STRATEGY=ollama         # Strategy to use for embeddings: "ollama" (default) or "openai"
 # Chat model configuration
 OLLAMA_CHAT_MODEL=MODEL           # Name of the Ollama model for chat
-OPENAI_CHAT_URL=URL               # OpenAI-compatible API URL
+OPENAI_CHAT_URL=URL               # OpenAI-compatible API URL for chat
-OPENAI_CHAT_KEY=KEY               # Authorization token for OpenAI-compatible API
+OPENAI_CHAT_KEY=KEY               # Authorization token for OpenAI-compatible API for chat
-OPENAI_CHAT_MODEL=MODEL           # Name of the OpenAI-compatible model to use
+OPENAI_CHAT_MODEL=MODEL           # Name of the OpenAI-compatible model to use for chat
-CHAT_MODEL_STRATEGY=ollama        # Strategy to use: "ollama" (default) or "openai"
+CHAT_MODEL_STRATEGY=ollama        # Strategy to use for chat: "ollama" (default) or "openai"
 ```
 ## Building and Running
@@ -235,3 +242,5 @@ The project is in early development phase. The virtual environment is set up and
 - If encountering "No module named 'unstructured_inference'" error, install unstructured-inference
 - If seeing OCR-related errors, ensure tesseract is installed at the system level and unstructured-pytesseract is available
 - For language detection issues, verify that appropriate spaCy models are downloaded
 - If getting Ollama connection errors when using OpenAI strategy, ensure EMBEDDING_STRATEGY is set correctly in .env
 - When deploying without Ollama, set both CHAT_MODEL_STRATEGY and EMBEDDING_STRATEGY to "openai" in your .env file
--- a/services/rag/langchain/vector_storage.py
+++ b/services/rag/langchain/vector_storage.py
@@ -1,4 +1,4 @@
-"""Vector storage module using Qdrant and Ollama embeddings for the RAG solution."""
+"""Vector storage module using Qdrant and configurable embeddings for the RAG solution."""
 import os
 from typing import Optional
@@ -7,6 +7,7 @@ from dotenv import load_dotenv
 from langchain_qdrant import QdrantVectorStore
 from langchain_core.documents import Document
 from langchain_ollama import OllamaEmbeddings
 from langchain_openai import OpenAIEmbeddings
 from qdrant_client import QdrantClient
 # Load environment variables
@@ -17,15 +18,19 @@ QDRANT_HOST = os.getenv("QDRANT_HOST", "localhost")
 QDRANT_REST_PORT = int(os.getenv("QDRANT_REST_PORT", 6333))
 QDRANT_GRPC_PORT = int(os.getenv("QDRANT_GRPC_PORT", 6334))
-# Ollama embedding model configuration
+# Embedding model configuration
 EMBEDDING_STRATEGY = os.getenv("EMBEDDING_STRATEGY", "ollama").lower()
 OLLAMA_EMBEDDING_MODEL = os.getenv("OLLAMA_EMBEDDING_MODEL", "nomic-embed-text")
 OPENAI_EMBEDDING_MODEL = os.getenv("OPENAI_EMBEDDING_MODEL", "text-embedding-ada-002")
 OPENAI_EMBEDDING_BASE_URL = os.getenv("OPENAI_EMBEDDING_BASE_URL")
 OPENAI_EMBEDDING_API_KEY = os.getenv("OPENAI_EMBEDDING_API_KEY")
 def initialize_vector_store(
    collection_name: str = "documents_langchain", recreate_collection: bool = False
 ) -> QdrantVectorStore:
    """
-    Initialize and return a Qdrant vector store with Ollama embeddings.
+    Initialize and return a Qdrant vector store with configurable embeddings.
    Args:
        collection_name: Name of the Qdrant collection to use
@@ -34,11 +39,24 @@ def initialize_vector_store(
    Returns:
        Initialized Qdrant vector store
    """
-    # Initialize Ollama embeddings
+    # Determine which embedding strategy to use
-    embeddings = OllamaEmbeddings(
+    if EMBEDDING_STRATEGY == "openai":
-        model=OLLAMA_EMBEDDING_MODEL,
+        # Validate required OpenAI embedding variables
-        base_url="http://localhost:11434",  # Default Ollama URL
+        if not OPENAI_EMBEDDING_API_KEY or not OPENAI_EMBEDDING_BASE_URL:
-    )
+            raise ValueError("OPENAI_EMBEDDING_API_KEY and OPENAI_EMBEDDING_BASE_URL must be set when using OpenAI embedding strategy")
        # Initialize OpenAI embeddings
        embeddings = OpenAIEmbeddings(
            model=OPENAI_EMBEDDING_MODEL,
            openai_api_base=OPENAI_EMBEDDING_BASE_URL,
            openai_api_key=OPENAI_EMBEDDING_API_KEY,
        )
    else:  # Default to ollama
        # Initialize Ollama embeddings
        embeddings = OllamaEmbeddings(
            model=OLLAMA_EMBEDDING_MODEL,
            base_url="http://localhost:11434",  # Default Ollama URL
        )
    # Check if collection exists and create if needed
    client = QdrantClient(