# rag-solution/services/rag/langchain/vector_storage.py
"""Vector storage module using Qdrant and Ollama embeddings for the RAG solution."""
import os
from typing import Optional
from dotenv import load_dotenv
from langchain_community.vectorstores import Qdrant
from langchain_core.documents import Document
from langchain_ollama import OllamaEmbeddings
from qdrant_client import QdrantClient
# Load environment variables
load_dotenv()
# Qdrant configuration
QDRANT_HOST = os.getenv("QDRANT_HOST", "localhost")
QDRANT_REST_PORT = int(os.getenv("QDRANT_REST_PORT", 6333))
QDRANT_GRPC_PORT = int(os.getenv("QDRANT_GRPC_PORT", 6334))
# Ollama embedding model configuration
OLLAMA_EMBEDDING_MODEL = os.getenv("OLLAMA_EMBEDDING_MODEL", "nomic-embed-text")
def initialize_vector_store(
    collection_name: str = "documents_langchain", recreate_collection: bool = False
) -> Qdrant:
    """
    Initialize and return a Qdrant vector store with Ollama embeddings.

    Args:
        collection_name: Name of the Qdrant collection to use.
        recreate_collection: If True, drop and recreate the collection when it
            already exists.

    Returns:
        Initialized Qdrant vector store connected to the requested collection.
    """
    # Initialize Qdrant client (REST transport).
    client = QdrantClient(
        host=QDRANT_HOST,
        port=QDRANT_REST_PORT,
    )

    # Initialize Ollama embeddings. The base URL is now configurable via the
    # OLLAMA_BASE_URL environment variable; the default matches the previous
    # hardcoded local daemon address, so behavior is unchanged by default.
    embeddings = OllamaEmbeddings(
        model=OLLAMA_EMBEDDING_MODEL,
        base_url=os.getenv("OLLAMA_BASE_URL", "http://localhost:11434"),
    )

    # Probe for the collection: the client raises when it does not exist.
    try:
        client.get_collection(collection_name)
        collection_exists = True
    except Exception:
        collection_exists = False

    if recreate_collection and collection_exists:
        client.delete_collection(collection_name)
        collection_exists = False

    # If the collection is missing, create it using the client directly.
    if not collection_exists:
        from qdrant_client.http.models import Distance, VectorParams

        # The vector size is model-dependent, so detect it by embedding a
        # throwaway query once. (Removed an unused `import numpy as np` here.)
        sample_embedding = embeddings.embed_query("sample text for dimension detection")
        client.create_collection(
            collection_name=collection_name,
            vectors_config=VectorParams(
                size=len(sample_embedding), distance=Distance.COSINE
            ),
        )

    # Single construction path for both branches (the original duplicated
    # this Qdrant(...) call in each arm of the if/else).
    return Qdrant(
        client=client,
        collection_name=collection_name,
        embeddings=embeddings,
    )
def add_documents_to_vector_store(
    vector_store: Qdrant, documents: list[Document], batch_size: int = 10
) -> None:
    """
    Insert documents into the vector store in fixed-size batches.

    Args:
        vector_store: Initialized Qdrant vector store.
        documents: Documents to index.
        batch_size: Maximum number of documents sent per add_documents call.
    """
    total = len(documents)
    start = 0
    while start < total:
        vector_store.add_documents(documents[start : start + batch_size])
        start += batch_size
def search_vector_store(vector_store: Qdrant, query: str, top_k: int = 5) -> list:
    """
    Retrieve the documents most similar to the query.

    Args:
        vector_store: Initialized Qdrant vector store.
        query: Free-text query to embed and match against the collection.
        top_k: Number of results to return.

    Returns:
        The top_k most similar documents.
    """
    hits = vector_store.similarity_search(query, k=top_k)
    return hits
# Just in case add possibility to connect via openai embedding, using openrouter api key.
# Comment this section, so it can be used in the future.
"""
# Alternative implementation using OpenAI embeddings via OpenRouter
# Uncomment and configure as needed
import os
from langchain_openai import OpenAIEmbeddings
OPENROUTER_API_KEY = os.getenv("OPENROUTER_API_KEY")
OPENROUTER_EMBEDDING_MODEL = os.getenv("OPENROUTER_EMBEDDING_MODEL", "openai/text-embedding-ada-002")
def initialize_vector_store_with_openrouter(
    collection_name: str = "documents_langchain"
) -> Qdrant:
# Initialize Qdrant client
client = QdrantClient(
host=QDRANT_HOST,
port=QDRANT_REST_PORT,
)
# Initialize OpenAI embeddings via OpenRouter
embeddings = OpenAIEmbeddings(
model=OPENROUTER_EMBEDDING_MODEL,
openai_api_key=OPENROUTER_API_KEY,
openai_api_base="https://openrouter.ai/api/v1"
)
# Create or get the vector store
vector_store = Qdrant(
client=client,
collection_name=collection_name,
embeddings=embeddings,
)
return vector_store
"""
if __name__ == "__main__":
# Example usage
print(
f"Initializing vector store with Ollama embedding model: {OLLAMA_EMBEDDING_MODEL}"
)
vector_store = initialize_vector_store()
print("Vector store initialized successfully!")