From 2d33aace4977e3225be201a2c9499f46d3f1f44a Mon Sep 17 00:00:00 2001
From: bridgeqiqi <Bridgeqiqi@163.com>
Date: Thu, 31 Jul 2025 23:16:46 +0800
Subject: [PATCH 01/17] init embedding

---
 docs/EMBEDDINGS.md                      |  76 ++++++
 examples/llm/embedding_block_example.py | 266 +++++++++++++++++++++
 quantmind/config/__init__.py            |   2 +
 quantmind/config/embedding.py           | 108 +++++++++
 quantmind/llm/__init__.py               |   3 +-
 quantmind/llm/embedding.py              | 305 ++++++++++++++++++++++++
 tests/llm/test_embedding.py             | 266 +++++++++++++++++++++
 7 files changed, 1025 insertions(+), 1 deletion(-)
 create mode 100644 docs/EMBEDDINGS.md
 create mode 100644 examples/llm/embedding_block_example.py
 create mode 100644 quantmind/config/embedding.py
 create mode 100644 quantmind/llm/embedding.py
 create mode 100644 tests/llm/test_embedding.py

diff --git a/docs/EMBEDDINGS.md b/docs/EMBEDDINGS.md
new file mode 100644
index 0000000..ff5176a
--- /dev/null
+++ b/docs/EMBEDDINGS.md
@@ -0,0 +1,76 @@
+# EmbeddingBlock Documentation
+
+## Overview
+
+The `EmbeddingBlock` class provides a flexible interface for generating text embeddings using LiteLLM. It supports multiple embedding providers through a single, consistent API.
+
+## Quick Start
+
+```python
+from quantmind.config import EmbeddingConfig
+from quantmind.llm import create_embedding_block
+
+# Simple configuration
+config = EmbeddingConfig(
+    model="text-embedding-ada-002"
+)
+
+embedding_block = create_embedding_block(config)
+embedding = embedding_block.generate_embedding("Sample text")
+```
+
+## Configuration
+
+### Required Parameters
+- `model`: Embedding model name (e.g., "text-embedding-ada-002")
+
+### Optional Parameters
+- `user`: Unique identifier for end-user
+- `dimensions`: Number of dimensions (OpenAI text-embedding-3+)
+- `encoding_format`: "float" or "base64" (default: "float")
+- `timeout`: Request timeout in seconds (default: 600)
+- `api_base`: Custom API endpoint
+- `api_version`: Azure-specific API version
+- `api_key`: API key for authentication
+- `api_type`: Type of API to use
+
+## Examples
+
+### Basic Usage
+```python
+config = EmbeddingConfig(model="text-embedding-ada-002")
+embedding_block = create_embedding_block(config)
+embedding = embedding_block.generate_embedding("Text to embed")
+```
+
+### With Custom Dimensions
+```python
+config = EmbeddingConfig(
+    model="text-embedding-3-small",
+    dimensions=512
+)
+```
+
+### Azure OpenAI
+```python
+config = EmbeddingConfig(
+    model="text-embedding-ada-002",
+    api_key="azure-key",
+    api_base="https://your-resource.openai.azure.com/",
+    api_version="2023-05-15",
+    api_type="azure"
+)
+```
+
+## Methods
+
+- `generate_embedding(text)`: Generate single embedding
+- `generate_embeddings(texts)`: Generate multiple embeddings
+- `batch_embed(texts, batch_size)`: Process large datasets
+- `test_connection()`: Test API connection
+- `get_info()`: Get configuration information
+- `get_embedding_dimension()`: Get embedding dimension
+
+## See Also
+
+- `examples/llm/embedding_block_example.py` for complete examples 
\ No newline at end of file
diff --git a/examples/llm/embedding_block_example.py b/examples/llm/embedding_block_example.py
new file mode 100644
index 0000000..76248ec
--- /dev/null
+++ b/examples/llm/embedding_block_example.py
@@ -0,0 +1,266 @@
+"""Example usage of EmbeddingBlock for different embedding providers."""
+
+import os
+from typing import List
+
+from quantmind.config import EmbeddingConfig
+from quantmind.llm import EmbeddingBlock, create_embedding_block
+from quantmind.utils.logger import get_logger
+
+logger = get_logger(__name__)
+
+
+def example_openai_embeddings():
+    """Example using OpenAI embeddings."""
+    print("\n=== OpenAI Embeddings Example ===")
+    
+    # Configuration for OpenAI embeddings
+    config = EmbeddingConfig(
+        model="text-embedding-ada-002",
+        api_key=os.getenv("OPENAI_API_KEY"),
+        timeout=30,
+        encoding_format="float",
+    )
+    
+    # Create embedding block
+    embedding_block = create_embedding_block(config)
+    
+    # Test connection
+    if embedding_block.test_connection():
+        print("✅ OpenAI connection successful")
+    else:
+        print("❌ OpenAI connection failed")
+        return
+    
+    # Generate single embedding
+    text = "This is a sample text for embedding generation."
+    embedding = embedding_block.generate_embedding(text)
+    
+    if embedding:
+        print(f"✅ Generated embedding with {len(embedding)} dimensions")
+        print(f"   First 5 values: {embedding[:5]}")
+    
+    # Generate multiple embeddings
+    texts = [
+        "First sample text for embedding.",
+        "Second sample text with different content.",
+        "Third sample text for batch processing."
+    ]
+    
+    embeddings = embedding_block.generate_embeddings(texts)
+    
+    if embeddings:
+        print(f"✅ Generated {len(embeddings)} embeddings")
+        for i, emb in enumerate(embeddings):
+            print(f"   Text {i+1}: {len(emb)} dimensions")
+    
+    # Get embedding information
+    info = embedding_block.get_info()
+    print(f"📊 Model info: {info['model']}")
+    print(f"📊 Provider: {info['provider']}")
+    print(f"📊 Dimension: {info['dimension']}")
+
+
+def example_openai_text_embedding_3():
+    """Example using OpenAI text-embedding-3 with custom dimensions."""
+    print("\n=== OpenAI Text-Embedding-3 Example ===")
+    
+    # Configuration for OpenAI text-embedding-3
+    config = EmbeddingConfig(
+        model="text-embedding-3-small",
+        api_key=os.getenv("OPENAI_API_KEY"),
+        dimensions=512,  # Custom dimension (default is 1536)
+        timeout=30,
+        encoding_format="float",
+    )
+    
+    # Create embedding block
+    embedding_block = create_embedding_block(config)
+    
+    # Test connection
+    if embedding_block.test_connection():
+        print("✅ OpenAI text-embedding-3 connection successful")
+    else:
+        print("❌ OpenAI text-embedding-3 connection failed")
+        return
+    
+    # Generate single embedding
+    text = "This is a sample text for embedding generation with custom dimensions."
+    embedding = embedding_block.generate_embedding(text)
+    
+    if embedding:
+        print(f"✅ Generated embedding with {len(embedding)} dimensions")
+        print(f"   First 5 values: {embedding[:5]}")
+    
+    # Generate multiple embeddings
+    texts = [
+        "First sample text for embedding.",
+        "Second sample text with different content.",
+        "Third sample text for batch processing."
+    ]
+    
+    embeddings = embedding_block.generate_embeddings(texts)
+    
+    if embeddings:
+        print(f"✅ Generated {len(embeddings)} embeddings")
+        for i, emb in enumerate(embeddings):
+            print(f"   Text {i+1}: {len(emb)} dimensions")
+    
+    # Get embedding information
+    info = embedding_block.get_info()
+    print(f"📊 Model info: {info['model']}")
+    print(f"📊 Provider: {info['provider']}")
+    print(f"📊 Dimension: {info['dimension']}")
+
+
+def example_azure_embeddings():
+    """Example using Azure OpenAI embeddings."""
+    print("\n=== Azure OpenAI Embeddings Example ===")
+    
+    # Configuration for Azure OpenAI embeddings
+    config = EmbeddingConfig(
+        model="text-embedding-ada-002",
+        api_key=os.getenv("AZURE_API_KEY"),
+        api_base=os.getenv("AZURE_API_BASE"),
+        api_version=os.getenv("AZURE_API_VERSION", "2023-05-15"),
+        api_type="azure",
+        timeout=30,
+        encoding_format="float",
+    )
+    
+    # Create embedding block
+    embedding_block = create_embedding_block(config)
+    
+    # Create embedding block
+    embedding_block = create_embedding_block(config)
+    
+    # Test connection
+    if embedding_block.test_connection():
+        print("✅ Azure OpenAI connection successful")
+    else:
+        print("❌ Azure OpenAI connection failed")
+        return
+    
+    # Generate single embedding
+    text = "This is a sample text for Azure OpenAI embedding generation."
+    embedding = embedding_block.generate_embedding(text)
+    
+    if embedding:
+        print(f"✅ Generated embedding with {len(embedding)} dimensions")
+        print(f"   First 5 values: {embedding[:5]}")
+    
+    # Generate multiple embeddings
+    texts = [
+        "First sample text for Azure embedding.",
+        "Second sample text with different content.",
+        "Third sample text for batch processing."
+    ]
+    
+    embeddings = embedding_block.generate_embeddings(texts)
+    
+    if embeddings:
+        print(f"✅ Generated {len(embeddings)} embeddings")
+        for i, emb in enumerate(embeddings):
+            print(f"   Text {i+1}: {len(emb)} dimensions")
+    
+    # Get embedding information
+    info = embedding_block.get_info()
+    print(f"📊 Model info: {info['model']}")
+    print(f"📊 Provider: {info['provider']}")
+    print(f"📊 Dimension: {info['dimension']}")
+
+
+def example_configuration_variants():
+    """Example showing different configuration variants."""
+    print("\n=== Configuration Variants Example ===")
+    
+    # Base configuration
+    base_config = EmbeddingConfig(
+        model="text-embedding-ada-002",
+        api_key=os.getenv("OPENAI_API_KEY"),
+        encoding_format="float",
+    )
+    
+    # Create variants with different parameters
+    fast_config = base_config.create_variant(
+        timeout=10,
+        retry_attempts=1
+    )
+    
+    conservative_config = base_config.create_variant(
+        timeout=120,
+        retry_attempts=5,
+        retry_delay=2.0
+    )
+    
+    print(f"Base config timeout: {base_config.timeout}s")
+    print(f"Fast config timeout: {fast_config.timeout}s")
+    print(f"Conservative config timeout: {conservative_config.timeout}s")
+    
+    # Test with temporary configuration
+    embedding_block = create_embedding_block(base_config)
+    
+    with embedding_block.temporary_config(timeout=5):
+        print("Using temporary configuration with 5s timeout")
+        # Any embedding operations here will use the temporary config
+        embedding = embedding_block.generate_embedding("Test with temp config")
+        if embedding:
+            print("✅ Temporary configuration worked")
+
+
+def example_error_handling():
+    """Example showing error handling and fallbacks."""
+    print("\n=== Error Handling Example ===")
+    
+    # Try with invalid API key
+    config = EmbeddingConfig(
+        model="text-embedding-ada-002",
+        api_key="invalid_key",
+        timeout=5,
+    )
+    
+    embedding_block = create_embedding_block(config)
+    
+    # This should fail gracefully
+    embedding = embedding_block.generate_embedding("Test text")
+    if embedding is None:
+        print("✅ Gracefully handled invalid API key")
+    
+    # Try with non-existent model
+    config = EmbeddingConfig(
+        model="non-existent-model",
+        timeout=5,
+    )
+    
+    try:
+        embedding_block = create_embedding_block(config)
+        print("❌ Should have failed with non-existent model")
+    except Exception as e:
+        print(f"✅ Gracefully handled non-existent model: {e}")
+
+
+def main():
+    """Run all embedding examples."""
+    print("🚀 EmbeddingBlock Examples")
+    print("=" * 50)
+    
+    # Run examples based on available API keys
+    if os.getenv("OPENAI_API_KEY"):
+        example_openai_embeddings()
+        example_openai_text_embedding_3()
+    else:
+        print("\n⚠️  Skipping OpenAI examples - OPENAI_API_KEY not set")
+    
+    if os.getenv("AZURE_API_KEY") and os.getenv("AZURE_API_BASE"):
+        example_azure_embeddings()
+    else:
+        print("\n⚠️  Skipping Azure example - AZURE_API_KEY or AZURE_API_BASE not set")
+    
+    example_configuration_variants()
+    example_error_handling()
+    
+    print("\n✅ All examples completed!")
+
+
+if __name__ == "__main__":
+    main() 
\ No newline at end of file
diff --git a/quantmind/config/__init__.py b/quantmind/config/__init__.py
index d20d111..49901c9 100644
--- a/quantmind/config/__init__.py
+++ b/quantmind/config/__init__.py
@@ -7,6 +7,7 @@
     SummaryFlowConfig,
 )
 from .llm import LLMConfig
+from .embedding import EmbeddingConfig
 from .parsers import LlamaParserConfig, PDFParserConfig
 from .settings import (
     Setting,
@@ -27,6 +28,7 @@
     "Setting",
     # LLM Configuration
     "LLMConfig",
+    "EmbeddingConfig",
     # Tagger Configurations
     "LLMTaggerConfig",
     # Parser Configurations
diff --git a/quantmind/config/embedding.py b/quantmind/config/embedding.py
new file mode 100644
index 0000000..e3f7587
--- /dev/null
+++ b/quantmind/config/embedding.py
@@ -0,0 +1,108 @@
+"""Embedding configuration for QuantMind."""
+
+from typing import Any, Dict, Optional
+
+from pydantic import BaseModel, Field, field_validator
+
+
+
+class EmbeddingConfig(BaseModel):
+    """Configuration for EmbeddingBlock."""
+
+    # Model configuration
+    model: str = Field(
+        default="text-embedding-ada-002", description="Embedding model name"
+    )
+
+    # Optional parameters
+    user: Optional[str] = Field(
+        default=None, description="A unique identifier representing your end-user"
+    )
+    dimensions: Optional[int] = Field(
+        default=None, description="The number of dimensions the resulting output embeddings should have. Only supported in OpenAI/Azure text-embedding-3 and later models"
+    )
+    encoding_format: str = Field(
+        default="float", description="The format to return the embeddings in. Can be either 'float' or 'base64'"
+    )
+    timeout: int = Field(
+        default=600, description="The maximum time, in seconds, to wait for the API to respond"
+    )
+    api_base: Optional[str] = Field(
+        default=None, description="The api endpoint you want to call the model with"
+    )
+    api_version: Optional[str] = Field(
+        default=None, description="(Azure-specific) the api version for the call"
+    )
+    api_key: Optional[str] = Field(
+        default=None, description="The API key to authenticate and authorize requests. If not provided, the default API key is used"
+    )
+    api_type: Optional[str] = Field(
+        default=None, description="The type of API to use"
+    )
+
+    @field_validator("model")
+    def validate_model(cls, v):
+        """Validate model name format."""
+        if not v or not isinstance(v, str):
+            raise ValueError("Model name must be a non-empty string")
+        return v.strip()
+
+    @field_validator("encoding_format")
+    def validate_encoding_format(cls, v):
+        """Validate encoding format."""
+        if v not in ["float", "base64"]:
+            raise ValueError("encoding_format must be 'float' or 'base64'")
+        return v
+
+    def get_litellm_params(self) -> Dict[str, Any]:
+        """Get parameters formatted for LiteLLM embedding."""
+        params = {
+            "model": self.model,
+            "encoding_format": self.encoding_format,
+            "timeout": self.timeout,
+        }
+
+        # Add optional parameters if provided
+        if self.user:
+            params["user"] = self.user
+        if self.dimensions:
+            params["dimensions"] = self.dimensions
+        if self.api_base:
+            params["api_base"] = self.api_base
+        if self.api_version:
+            params["api_version"] = self.api_version
+        if self.api_key:
+            params["api_key"] = self.api_key
+        if self.api_type:
+            params["api_type"] = self.api_type
+
+        return params
+
+    def get_provider_type(self) -> str:
+        """Extract provider type from model name."""
+        model_lower = self.model.lower()
+        
+        # OpenAI models
+        if (model_lower.startswith("text-embedding-") or 
+            model_lower.startswith("openai/") or
+            "ada" in model_lower or "3" in model_lower):
+            return "openai"
+        
+        # Azure models
+        elif "azure" in model_lower:
+            return "azure"
+        
+        # Cohere models
+        elif (model_lower.startswith("embed-") or
+              model_lower.startswith("cohere/")):
+            return "cohere"
+        
+        # Default to openai for unknown models
+        else:
+            return "unknown"
+
+    def create_variant(self, **overrides) -> "EmbeddingConfig":
+        """Create a variant of this config with parameter overrides."""
+        current_dict = self.model_dump()
+        current_dict.update(overrides)
+        return EmbeddingConfig(**current_dict)
diff --git a/quantmind/llm/__init__.py b/quantmind/llm/__init__.py
index caab46f..20a9b6b 100644
--- a/quantmind/llm/__init__.py
+++ b/quantmind/llm/__init__.py
@@ -1,8 +1,9 @@
 """LLM module for QuantMind - Basic LLM functionality."""
 
 from .block import LLMBlock, create_llm_block
+from .embedding import EmbeddingBlock, create_embedding_block
 
 __all__ = [
     "LLMBlock",
-    "create_llm_block",
+    "create_llm_block"
 ]
diff --git a/quantmind/llm/embedding.py b/quantmind/llm/embedding.py
new file mode 100644
index 0000000..10487ff
--- /dev/null
+++ b/quantmind/llm/embedding.py
@@ -0,0 +1,305 @@
+"""EmbeddingBlock - A reusable Embedding function block using LiteLLM."""
+
+import os
+import time
+import numpy as np
+from contextlib import contextmanager
+from typing import Any, Dict, List, Optional
+
+from quantmind.utils.logger import get_logger
+
+from ..config import EmbeddingConfig
+
+logger = get_logger(__name__)
+
+try:
+    import litellm
+    from litellm import embedding
+    
+    LITELLM_AVAILABLE = True
+except ImportError:
+    LITELLM_AVAILABLE = False
+
+class EmbeddingBlock:
+	"""A reusable Embedding function block using LiteLLM.
+	
+	EmbeddingBlock provides a consistent interface for generating embeddings across different providers (OpenAI, Anthropic, etc.).
+	
+	Unlike workflows, EmbeddingBlock focuses on providing basic embedding capabilities without business logic."""
+	
+	def __init__(self, config: EmbeddingConfig):
+		"""Initialize the EmbeddingBlock with configuration.
+		
+		Args:
+			config: Embedding configuration
+		
+		Raises:
+			ImportError: If LiteLLM is not available.
+		"""
+		if not LITELLM_AVAILABLE:
+			raise ImportError("litellm is required for EmbeddingBlock but not installed.")
+		
+		self.config = config
+		self._setup_litellm()
+		
+		logger.info(f"Initialized EmbeddingBlock with model: {config.model}")
+
+	def _setup_litellm(self):
+		"""Setup LiteLLM configuration."""
+		# Set global LiteLLM settings
+		litellm.set_verbose = False  # Disable verbose logging by default
+		
+		# Configure retries
+		litellm.num_retries = self.config.retry_attempts
+		litellm.request_timeout = self.config.timeout
+		
+		# Set API key as environment variable if provided
+		if self.config.api_key:
+			provider_type = self.config.get_provider_type()
+			if provider_type == "openai":
+				os.environ["OPENAI_API_KEY"] = self.config.api_key
+			elif provider_type == "azure":
+				os.environ["AZURE_API_KEY"] = self.config.api_key
+			elif provider_type == "cohere":
+				os.environ["COHERE_API_KEY"] = self.config.api_key
+		
+		logger.debug(f"Configured LiteLLM for provider: {self.config.get_provider_type()}")
+	
+	
+	def generate_embedding(self, text: str, **kwargs) -> Optional[List[float]]:
+		"""Generate embedding using the configured Embedding model.
+
+		Args:
+			text (str): The input text to embed.
+			**kwargs: Additional parameters to override config
+
+		Returns:
+			List[float]: The embedding vector as a list of floats, or None if failed.
+		"""
+		try:
+			# Get LiteLLM parameters
+			params = self.config.get_litellm_params()
+			params.update(kwargs)  # Allow runtime overrides
+			
+			# Add input text
+			params["input"] = text
+			
+			# Call LiteLLM embedding
+			response = self._call_with_retry(params)
+			
+			if response and hasattr(response, 'data'):
+				# Extract embedding from response
+				embedding_data = response.data[0] if isinstance(response.data, list) else response.data
+				return embedding_data.embedding
+			
+			return None
+			
+		except Exception as e:
+			logger.error(f"Failed to generate embedding: {e}")
+			return None
+
+	def generate_embeddings(self, texts: List[str], **kwargs) -> Optional[List[List[float]]]:
+		"""Generate embeddings for multiple texts.
+
+		Args:
+			texts (List[str]): List of input texts to embed.
+			**kwargs: Additional parameters to override config
+
+		Returns:
+			List[List[float]]: List of embedding vectors, or None if failed.
+		"""
+		try:
+			# Get LiteLLM parameters
+			params = self.config.get_litellm_params()
+			params.update(kwargs)  # Allow runtime overrides
+			
+			# Add input texts
+			params["input"] = texts
+			
+			# Call LiteLLM embedding
+			response = self._call_with_retry(params)
+			
+			if response and hasattr(response, 'data'):
+				# Extract embeddings from response
+				return [item.embedding for item in response.data]
+			
+			return None
+			
+		except Exception as e:
+			logger.error(f"Failed to generate embeddings: {e}")
+			return None
+	
+	def _call_with_retry(self, params: Dict[str, Any]) -> Optional[Any]:
+		"""Call LiteLLM embedding with retry logic.
+
+		Args:
+			params (Dict[str, Any]): The parameters to pass to the embedding function.
+
+		Returns:
+			Optional[Any]: The embedding result or None if failed.
+		"""
+		last_exception = None
+		for attempt in range(self.config.retry_attempts + 1):
+			try:
+				logger.debug(
+					f"Embedding call attempt {attempt + 1}/{self.config.retry_attempts + 1}"
+				)
+				
+				# Extract input from params and remove it for the embedding call
+				input_text = params.pop("input")
+				response = embedding(model=self.config.model, input=input_text, **params)
+
+				if hasattr(response, "usage") and response.usage:
+					logger.debug(f"Token usage: {response.usage}")
+				return response
+			except Exception as e:
+				last_exception = e
+				logger.warning(f"Embedding call attempt {attempt + 1} failed: {e}")
+
+				if attempt < self.config.retry_attempts:
+					time.sleep(self.config.retry_delay)
+				else:
+					logger.error(
+						f"All {self.config.retry_attempts + 1} attempts failed"
+					)
+		
+		# Log final error
+		if last_exception:
+			logger.error(f"Final error: {last_exception}")
+
+		return None
+
+
+	def test_connection(self) -> bool:
+		"""Test if the embedding connection is working.
+
+        Returns:
+            True if connection is working, False otherwise
+        """
+		try:
+			response = self.generate_embedding(
+				"Hello, this is a test for embedding generation. Please respond with 'OK'."
+			)
+			return response is not None and len(response) > 0
+		except Exception as e:
+			logger.error(f"Connection test failed: {e}")
+			return False
+
+
+	def get_info(self) -> Dict[str, Any]:
+		"""Get information about the embedding block.
+
+		Returns:
+			Dictionary with embedding block information
+		"""
+		info = {
+			"model": self.config.model,
+			"provider": self.config.get_provider_type(),
+			"dimension": self.get_embedding_dimension(),
+			"config": self.config.model_dump(),
+		}
+		return info
+
+	def get_embedding_dimension(self) -> Optional[int]:
+		"""Get the dimension of embeddings generated by this model.
+
+		Returns:
+			Embedding dimension or None if not available
+		"""
+		# First check if dimensions is specified in config
+		if self.config.dimensions:
+			return self.config.dimensions
+		
+		try:
+			# Try to get dimension by generating a test embedding
+			test_embedding = self.generate_embedding("test")
+			return len(test_embedding) if test_embedding else None
+		except Exception as e:
+			logger.error(f"Failed to get embedding dimension: {e}")
+			return None
+
+	def update_config(self, **kwargs) -> None:
+		"""Update the embedding configuration.
+
+		Args:
+			**kwargs: Configuration parameters to update
+		"""
+		for key, value in kwargs.items():
+			if hasattr(self.config, key):
+				setattr(self.config, key, value)
+
+		logger.info(f"Updated embedding configuration: {kwargs}")
+
+	@contextmanager
+	def temporary_config(self, **kwargs):
+		"""Temporarily modify configuration for a context.
+
+		Args:
+			**kwargs: Temporary configuration parameters
+
+		Yields:
+			Self with temporary configuration
+		"""
+		original_config = {}
+		for key, value in kwargs.items():
+			if hasattr(self.config, key):
+				original_config[key] = getattr(self.config, key)
+				setattr(self.config, key, value)
+
+		try:
+			yield self
+		finally:
+			# Restore original configuration
+			for key, value in original_config.items():
+				setattr(self.config, key, value)
+
+	def batch_embed(
+		self, 
+		texts: List[str], 
+		batch_size: int = 32,
+		**kwargs
+	) -> Optional[List[List[float]]]:
+		"""Generate embeddings in batches for large datasets.
+
+		Args:
+			texts: List of texts to embed
+			batch_size: Number of texts to process in each batch
+			**kwargs: Additional parameters for embedding generation
+
+		Returns:
+			List of embedding vectors or None if failed
+		"""
+		try:
+			all_embeddings = []
+			
+			for i in range(0, len(texts), batch_size):
+				batch = texts[i:i + batch_size]
+				batch_embeddings = self.generate_embeddings(batch, **kwargs)
+				
+				if batch_embeddings is None:
+					logger.error(f"Failed to generate embeddings for batch {i//batch_size}")
+					return None
+				
+				all_embeddings.extend(batch_embeddings)
+				
+				# Add delay between batches if specified
+				if self.config.retry_delay > 0 and i + batch_size < len(texts):
+					time.sleep(self.config.retry_delay)
+
+			return all_embeddings
+
+		except Exception as e:
+			logger.error(f"Batch embedding failed: {e}")
+			return None
+
+
+def create_embedding_block(config: EmbeddingConfig) -> EmbeddingBlock:
+	"""Create an EmbeddingBlock instance.
+
+	Args:
+		config: Embedding configuration
+
+	Returns:
+		Configured EmbeddingBlock instance
+	"""
+	return EmbeddingBlock(config)
\ No newline at end of file
diff --git a/tests/llm/test_embedding.py b/tests/llm/test_embedding.py
new file mode 100644
index 0000000..88bc673
--- /dev/null
+++ b/tests/llm/test_embedding.py
@@ -0,0 +1,266 @@
+"""Tests for EmbeddingBlock."""
+
+import unittest
+from unittest.mock import Mock, patch
+
+from quantmind.config import EmbeddingConfig
+from quantmind.llm import EmbeddingBlock, create_embedding_block
+
+
+class TestEmbeddingConfig(unittest.TestCase):
+    """Test EmbeddingConfig class."""
+
+    def test_default_config(self):
+        """Test default configuration."""
+        config = EmbeddingConfig()
+        
+        self.assertEqual(config.model, "text-embedding-ada-002")
+        self.assertIsNone(config.api_key)
+        self.assertEqual(config.timeout, 60)
+        self.assertEqual(config.batch_size, 32)
+        self.assertTrue(config.normalize)
+
+    def test_custom_config(self):
+        """Test custom configuration."""
+        config = EmbeddingConfig(
+            model="sentence-transformers/all-MiniLM-L6-v2",
+            api_key="test_key",
+            timeout=30,
+            batch_size=16,
+            normalize=False,
+            device="cuda"
+        )
+        
+        self.assertEqual(config.model, "sentence-transformers/all-MiniLM-L6-v2")
+        self.assertEqual(config.api_key, "test_key")
+        self.assertEqual(config.timeout, 30)
+        self.assertEqual(config.batch_size, 16)
+        self.assertFalse(config.normalize)
+        self.assertEqual(config.device, "cuda")
+
+    def test_provider_detection(self):
+        """Test provider type detection."""
+        # OpenAI models
+        config = EmbeddingConfig(model="text-embedding-ada-002")
+        self.assertEqual(config.get_provider_type(), "openai")
+        
+        config = EmbeddingConfig(model="text-embedding-3-small")
+        self.assertEqual(config.get_provider_type(), "openai")
+        
+        # SentenceTransformers models
+        config = EmbeddingConfig(model="sentence-transformers/all-MiniLM-L6-v2")
+        self.assertEqual(config.get_provider_type(), "sentence_transformers")
+        
+        config = EmbeddingConfig(model="all-MiniLM-L6-v2")
+        self.assertEqual(config.get_provider_type(), "sentence_transformers")
+        
+        # Cohere models
+        config = EmbeddingConfig(model="embed-english-v3.0")
+        self.assertEqual(config.get_provider_type(), "cohere")
+        
+        config = EmbeddingConfig(model="cohere/embed-multilingual-v3.0")
+        self.assertEqual(config.get_provider_type(), "cohere")
+
+    def test_create_variant(self):
+        """Test creating configuration variants."""
+        base_config = EmbeddingConfig(
+            model="text-embedding-ada-002",
+            timeout=60,
+            batch_size=32
+        )
+        
+        variant = base_config.create_variant(
+            timeout=30,
+            batch_size=16
+        )
+        
+        self.assertEqual(variant.model, "text-embedding-ada-002")
+        self.assertEqual(variant.timeout, 30)
+        self.assertEqual(variant.batch_size, 16)
+
+    def test_validation(self):
+        """Test configuration validation."""
+        # Test invalid model
+        with self.assertRaises(ValueError):
+            EmbeddingConfig(model="")
+        
+        with self.assertRaises(ValueError):
+            EmbeddingConfig(model=None)
+        
+        # Test invalid API key
+        with self.assertRaises(ValueError):
+            EmbeddingConfig(api_key=123)
+
+
+class TestEmbeddingBlock(unittest.TestCase):
+    """Test EmbeddingBlock class."""
+
+    def setUp(self):
+        """Set up test fixtures."""
+        self.config = EmbeddingConfig(
+            model="sentence-transformers/all-MiniLM-L6-v2",
+            normalize=True
+        )
+
+    @patch('quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE', True)
+    @patch('quantmind.llm.embedding.SentenceTransformer')
+    def test_initialization(self, mock_sentence_transformer):
+        """Test EmbeddingBlock initialization."""
+        mock_model = Mock()
+        mock_sentence_transformer.return_value = mock_model
+        
+        embedding_block = EmbeddingBlock(self.config)
+        
+        self.assertEqual(embedding_block.config, self.config)
+        mock_sentence_transformer.assert_called_once_with(self.config.model)
+
+    @patch('quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE', False)
+    def test_initialization_missing_dependency(self):
+        """Test initialization with missing dependency."""
+        with self.assertRaises(ImportError):
+            EmbeddingBlock(self.config)
+
+    @patch('quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE', True)
+    @patch('quantmind.llm.embedding.SentenceTransformer')
+    def test_generate_embedding(self, mock_sentence_transformer):
+        """Test single embedding generation."""
+        mock_model = Mock()
+        mock_model.encode.return_value = [0.1, 0.2, 0.3, 0.4, 0.5]
+        mock_sentence_transformer.return_value = mock_model
+        
+        embedding_block = EmbeddingBlock(self.config)
+        embedding = embedding_block.generate_embedding("test text")
+        
+        self.assertEqual(embedding, [0.1, 0.2, 0.3, 0.4, 0.5])
+        mock_model.encode.assert_called_once_with("test text")
+
+    @patch('quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE', True)
+    @patch('quantmind.llm.embedding.SentenceTransformer')
+    def test_generate_embeddings(self, mock_sentence_transformer):
+        """Test multiple embedding generation."""
+        mock_model = Mock()
+        mock_model.encode.return_value = [
+            [0.1, 0.2, 0.3],
+            [0.4, 0.5, 0.6]
+        ]
+        mock_sentence_transformer.return_value = mock_model
+        
+        embedding_block = EmbeddingBlock(self.config)
+        embeddings = embedding_block.generate_embeddings(["text1", "text2"])
+        
+        self.assertEqual(embeddings, [[0.1, 0.2, 0.3], [0.4, 0.5, 0.6]])
+        mock_model.encode.assert_called_once_with(["text1", "text2"])
+
+    @patch('quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE', True)
+    @patch('quantmind.llm.embedding.SentenceTransformer')
+    def test_get_embedding_dimension(self, mock_sentence_transformer):
+        """Test getting embedding dimension."""
+        mock_model = Mock()
+        mock_model.encode.return_value = [0.1, 0.2, 0.3, 0.4, 0.5]
+        mock_sentence_transformer.return_value = mock_model
+        
+        embedding_block = EmbeddingBlock(self.config)
+        dimension = embedding_block.get_embedding_dimension()
+        
+        self.assertEqual(dimension, 5)
+
+    @patch('quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE', True)
+    @patch('quantmind.llm.embedding.SentenceTransformer')
+    def test_test_connection(self, mock_sentence_transformer):
+        """Test connection testing."""
+        mock_model = Mock()
+        mock_model.encode.return_value = [0.1, 0.2, 0.3]
+        mock_sentence_transformer.return_value = mock_model
+        
+        embedding_block = EmbeddingBlock(self.config)
+        result = embedding_block.test_connection()
+        
+        self.assertTrue(result)
+
+    @patch('quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE', True)
+    @patch('quantmind.llm.embedding.SentenceTransformer')
+    def test_get_info(self, mock_sentence_transformer):
+        """Test getting embedding block information."""
+        mock_model = Mock()
+        mock_model.encode.return_value = [0.1, 0.2, 0.3]
+        mock_sentence_transformer.return_value = mock_model
+        
+        embedding_block = EmbeddingBlock(self.config)
+        info = embedding_block.get_info()
+        
+        self.assertEqual(info["model"], self.config.model)
+        self.assertEqual(info["provider"], "sentence_transformers")
+        self.assertEqual(info["dimension"], 3)
+        self.assertIn("config", info)
+
+    @patch('quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE', True)
+    @patch('quantmind.llm.embedding.SentenceTransformer')
+    def test_update_config(self, mock_sentence_transformer):
+        """Test configuration updates."""
+        mock_model = Mock()
+        mock_sentence_transformer.return_value = mock_model
+        
+        embedding_block = EmbeddingBlock(self.config)
+        
+        # Update timeout
+        embedding_block.update_config(timeout=30)
+        self.assertEqual(embedding_block.config.timeout, 30)
+        
+        # Update model (should reinitialize)
+        embedding_block.update_config(model="sentence-transformers/all-mpnet-base-v2")
+        self.assertEqual(embedding_block.config.model, "sentence-transformers/all-mpnet-base-v2")
+
+    @patch('quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE', True)
+    @patch('quantmind.llm.embedding.SentenceTransformer')
+    def test_temporary_config(self, mock_sentence_transformer):
+        """Test temporary configuration context manager."""
+        mock_model = Mock()
+        mock_model.encode.return_value = [0.1, 0.2, 0.3]
+        mock_sentence_transformer.return_value = mock_model
+        
+        embedding_block = EmbeddingBlock(self.config)
+        original_timeout = embedding_block.config.timeout
+        
+        with embedding_block.temporary_config(timeout=10):
+            self.assertEqual(embedding_block.config.timeout, 10)
+        
+        # Should be restored
+        self.assertEqual(embedding_block.config.timeout, original_timeout)
+
+    @patch('quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE', True)
+    @patch('quantmind.llm.embedding.SentenceTransformer')
+    def test_batch_embed(self, mock_sentence_transformer):
+        """Test batch embedding processing."""
+        mock_model = Mock()
+        mock_model.encode.return_value = [[0.1, 0.2], [0.3, 0.4]]
+        mock_sentence_transformer.return_value = mock_model
+        
+        embedding_block = EmbeddingBlock(self.config)
+        texts = ["text1", "text2", "text3", "text4"]
+        
+        embeddings = embedding_block.batch_embed(texts, batch_size=2)
+        
+        self.assertEqual(len(embeddings), 4)
+        # Should have been called twice (2 batches of 2)
+        self.assertEqual(mock_model.encode.call_count, 2)
+
+
+class TestCreateEmbeddingBlock(unittest.TestCase):
+    """Test create_embedding_block function."""
+
+    def test_create_embedding_block(self):
+        """Test creating embedding block."""
+        config = EmbeddingConfig(
+            model="sentence-transformers/all-MiniLM-L6-v2"
+        )
+        
+        with patch('quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE', True):
+            with patch('quantmind.llm.embedding.SentenceTransformer'):
+                embedding_block = create_embedding_block(config)
+                
+                self.assertIsInstance(embedding_block, EmbeddingBlock)
+                self.assertEqual(embedding_block.config, config)
+
+
+if __name__ == "__main__":
+    unittest.main()
\ No newline at end of file

From aac5db4800eceb360400c3b8fa7ee0bfe131233a Mon Sep 17 00:00:00 2001
From: bridgeqiqi <Bridgeqiqi@163.com>
Date: Thu, 31 Jul 2025 23:48:13 +0800
Subject: [PATCH 02/17] add wiki/embedding.md

---
 wiki/embedding.md | 326 ++++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 326 insertions(+)
 create mode 100644 wiki/embedding.md

diff --git a/wiki/embedding.md b/wiki/embedding.md
new file mode 100644
index 0000000..854c151
--- /dev/null
+++ b/wiki/embedding.md
@@ -0,0 +1,326 @@
+# 🌟 Embedding Systems in QuantMind 🌟
+
+## 📋 Table of Contents
+
+<details>
+  <summary><strong>📜 Contents</strong></summary>
+  <ol>
+    <li><a href="#overview">📌 Overview</a></li>
+    <li><a href="#theoretical-background">📌 Theoretical Background</a></li>
+    <li><a href="#architecture">📌 Architecture</a></li>
+    <li><a href="#configuration">📌 Configuration</a></li>
+    <li><a href="#usage-examples">📌 Usage Examples</a></li>
+    <li><a href="#advanced-features">📌 Advanced Features</a></li>
+    <li><a href="#best-practices">📌 Best Practices</a></li>
+  </ol>
+</details>
+
+## 📌 Overview
+
+Embeddings are numerical representations of text that capture semantic meaning in high-dimensional vector spaces. In quantitative finance, embeddings enable:
+
+- **Document Analysis**: Converting financial reports into searchable vectors
+- **Semantic Search**: Finding similar financial documents
+- **Content Clustering**: Grouping related financial information
+- **Feature Engineering**: Creating numerical features from textual data
+
+QuantMind provides a flexible embedding system through the `EmbeddingBlock` class, supporting multiple providers via a unified interface.
+
+## 📌 Theoretical Background
+
+### What are Embeddings?
+
+Embeddings map discrete objects (words, sentences, documents) to continuous vector spaces where:
+- **Similar objects** are positioned close to each other
+- **Mathematical operations** have semantic meaning
+- **Dimensionality** typically ranges from 100 to 1536 dimensions
+
+### Supported Models
+
+| Model | Dimensions | Use Case | Provider |
+|-------|------------|----------|----------|
+| `text-embedding-ada-002` | 1536 | General purpose | OpenAI |
+| `text-embedding-3-small` | 1536 | High performance | OpenAI |
+| `text-embedding-3-large` | 3072 | Maximum quality | OpenAI |
+| `embed-english-v3.0` | 1024 | Multilingual | Cohere |
+
+## 📌 Architecture
+
+### Core Components
+
+```python
+from quantmind.config import EmbeddingConfig
+from quantmind.llm import EmbeddingBlock, create_embedding_block
+```
+
+#### EmbeddingConfig
+Manages all embedding parameters:
+
+```python
+class EmbeddingConfig(BaseModel):
+    model: str = "text-embedding-ada-002"
+    user: Optional[str] = None
+    dimensions: Optional[int] = None
+    encoding_format: str = "float"
+    timeout: int = 600
+    api_base: Optional[str] = None
+    api_version: Optional[str] = None
+    api_key: Optional[str] = None
+    api_type: Optional[str] = None
+```
+
+#### EmbeddingBlock
+Main interface for generating embeddings:
+
+```python
+class EmbeddingBlock:
+    def generate_embedding(self, text: str) -> Optional[List[float]]
+    def generate_embeddings(self, texts: List[str]) -> Optional[List[List[float]]]
+    def batch_embed(self, texts: List[str], batch_size: int = 100) -> List[List[float]]
+    def test_connection(self) -> bool
+    def get_info(self) -> Dict[str, Any]
+```
+
+## 📌 Configuration
+
+### Basic Setup
+
+```python
+from quantmind.config import EmbeddingConfig
+
+# Simple configuration
+config = EmbeddingConfig(
+    model="text-embedding-ada-002",
+    api_key="your-api-key"
+)
+```
+
+### Advanced Configuration
+
+```python
+# Custom dimensions (OpenAI text-embedding-3+)
+config = EmbeddingConfig(
+    model="text-embedding-3-small",
+    dimensions=512,  # Reduce from default 1536
+    encoding_format="float",
+    timeout=30
+)
+
+# Azure OpenAI
+config = EmbeddingConfig(
+    model="text-embedding-ada-002",
+    api_key="azure-key",
+    api_base="https://your-resource.openai.azure.com/",
+    api_version="2023-05-15",
+    api_type="azure"
+)
+```
+
+## 📌 Usage Examples
+
+### Basic Embedding Generation
+
+```python
+from quantmind.config import EmbeddingConfig
+from quantmind.llm import create_embedding_block
+
+# Create configuration
+config = EmbeddingConfig(
+    model="text-embedding-ada-002",
+    api_key=os.getenv("OPENAI_API_KEY")
+)
+
+# Create embedding block
+embedding_block = create_embedding_block(config)
+
+# Generate single embedding
+text = "Apple Inc. reported strong quarterly earnings with revenue growth of 15%."
+embedding = embedding_block.generate_embedding(text)
+
+if embedding:
+    print(f"Generated embedding with {len(embedding)} dimensions")
+    print(f"First 5 values: {embedding[:5]}")
+```
+
+### Batch Processing
+
+```python
+# Generate multiple embeddings
+texts = [
+    "Apple Inc. reported strong quarterly earnings.",
+    "Microsoft Corp. announced new AI initiatives.",
+    "Tesla Inc. delivered record vehicle production.",
+    "Amazon.com Inc. expanded cloud services."
+]
+
+embeddings = embedding_block.generate_embeddings(texts)
+
+if embeddings:
+    print(f"Generated {len(embeddings)} embeddings")
+    for i, emb in enumerate(embeddings):
+        print(f"Text {i+1}: {len(emb)} dimensions")
+```
+
+### Semantic Similarity
+
+```python
+import numpy as np
+from sklearn.metrics.pairwise import cosine_similarity
+
+def calculate_similarity(text1: str, text2: str) -> float:
+    """Calculate semantic similarity between two texts."""
+    embeddings = embedding_block.generate_embeddings([text1, text2])
+    
+    if embeddings and len(embeddings) == 2:
+        similarity = cosine_similarity(
+            [embeddings[0]], 
+            [embeddings[1]]
+        )[0][0]
+        return similarity
+    
+    return 0.0
+
+# Example usage
+text1 = "Apple's iPhone sales exceeded expectations"
+text2 = "iPhone revenue surpassed analyst predictions"
+similarity = calculate_similarity(text1, text2)
+print(f"Similarity: {similarity:.3f}")
+```
+
+## 📌 Advanced Features
+
+### Custom Dimensions
+
+```python
+# Reduce embedding dimensions for efficiency
+config = EmbeddingConfig(
+    model="text-embedding-3-small",
+    dimensions=512  # Reduce from 1536 to 512
+)
+
+embedding_block = create_embedding_block(config)
+embedding = embedding_block.generate_embedding("Sample text")
+print(f"Reduced dimensions: {len(embedding)}")  # 512
+```
+
+### Connection Testing
+
+```python
+# Test API connection before processing
+if embedding_block.test_connection():
+    print("✅ API connection successful")
+    # Proceed with embedding generation
+else:
+    print("❌ API connection failed")
+    # Handle error or retry
+```
+
+### Configuration Information
+
+```python
+# Get detailed configuration information
+info = embedding_block.get_info()
+print(f"Model: {info['model']}")
+print(f"Provider: {info['provider']}")
+print(f"Dimensions: {info['dimension']}")
+print(f"Format: {info['encoding_format']}")
+```
+
+## 📌 Best Practices
+
+### 1. Model Selection
+
+| Use Case | Recommended Model | Reasoning |
+|----------|------------------|-----------|
+| **General purpose** | `text-embedding-ada-002` | Good balance of quality and cost |
+| **High performance** | `text-embedding-3-small` | Better quality, slightly higher cost |
+| **Maximum quality** | `text-embedding-3-large` | Best quality, highest cost |
+| **Multilingual** | `embed-multilingual-v3.0` | Support for multiple languages |
+
+### 2. Batch Processing
+
+```python
+# Efficient batch processing
+def efficient_batch_embedding(texts: List[str], batch_size: int = 100):
+    """Process texts in optimal batches."""
+    all_embeddings = []
+    
+    for i in range(0, len(texts), batch_size):
+        batch = texts[i:i + batch_size]
+        try:
+            batch_embeddings = embedding_block.generate_embeddings(batch)
+            if batch_embeddings:
+                all_embeddings.extend(batch_embeddings)
+        except Exception as e:
+            print(f"Error processing batch {i//batch_size + 1}: {e}")
+    
+    return all_embeddings
+```
+
+### 3. Error Handling
+
+```python
+def robust_embedding_generation(text: str, max_retries: int = 3):
+    """Generate embedding with retry logic."""
+    for attempt in range(max_retries):
+        try:
+            embedding = embedding_block.generate_embedding(text)
+            if embedding:
+                return embedding
+        except Exception as e:
+            print(f"Attempt {attempt + 1} failed: {e}")
+            if attempt < max_retries - 1:
+                time.sleep(2 ** attempt)  # Exponential backoff
+    
+    return None
+```
+
+### 4. Caching
+
+```python
+import hashlib
+import pickle
+import os
+
+class CachedEmbeddingBlock:
+    def __init__(self, embedding_block, cache_dir: str = "embedding_cache"):
+        self.embedding_block = embedding_block
+        self.cache_dir = cache_dir
+        os.makedirs(cache_dir, exist_ok=True)
+    
+    def get_embedding(self, text: str) -> Optional[List[float]]:
+        # Create cache key
+        text_hash = hashlib.md5(text.encode()).hexdigest()
+        cache_file = os.path.join(self.cache_dir, f"{text_hash}.pkl")
+        
+        # Check cache
+        if os.path.exists(cache_file):
+            with open(cache_file, 'rb') as f:
+                return pickle.load(f)
+        
+        # Generate embedding
+        embedding = self.embedding_block.generate_embedding(text)
+        
+        # Cache result
+        if embedding:
+            with open(cache_file, 'wb') as f:
+                pickle.dump(embedding, f)
+        
+        return embedding
+```
+
+## 📚 Related Documentation
+
+- [EmbeddingBlock API Reference](../docs/EMBEDDINGS.md)
+- [Examples](../examples/llm/embedding_block_example.py)
+- [Configuration Guide](../quantmind/config/embedding.py)
+
+## 🔗 External Resources
+
+- [OpenAI Embeddings Guide](https://platform.openai.com/docs/guides/embeddings)
+- [Cohere Embeddings](https://docs.cohere.com/docs/embeddings)
+- [Vector Similarity Search](https://www.pinecone.io/learn/vector-similarity-search/)
+
+---
+
+*Last updated: January 2025* 
\ No newline at end of file

From 30b2635ca3bc7a6577ea346afd5489ee156b821a Mon Sep 17 00:00:00 2001
From: bridgeqiqi <Bridgeqiqi@163.com>
Date: Thu, 31 Jul 2025 23:52:36 +0800
Subject: [PATCH 03/17] update __init__.py

---
 quantmind/llm/__init__.py | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/quantmind/llm/__init__.py b/quantmind/llm/__init__.py
index 20a9b6b..55ad035 100644
--- a/quantmind/llm/__init__.py
+++ b/quantmind/llm/__init__.py
@@ -5,5 +5,7 @@
 
 __all__ = [
     "LLMBlock",
-    "create_llm_block"
+    "create_llm_block",
+    "EmbeddingBlock",
+    "create_embedding_block",
 ]

From 387d3de25b8631b8076806d808ce97793224c51a Mon Sep 17 00:00:00 2001
From: bridgeqiqi <Bridgeqiqi@163.com>
Date: Fri, 1 Aug 2025 00:46:27 +0800
Subject: [PATCH 04/17] ruff format

---
 examples/llm/embedding_block_example.py      | 117 ++--
 examples/storage/storage_performance_demo.py |   8 +-
 quantmind/config/embedding.py                |  44 +-
 quantmind/llm/embedding.py                   | 562 ++++++++++---------
 tests/llm/test_embedding.py                  | 146 +++--
 5 files changed, 448 insertions(+), 429 deletions(-)

diff --git a/examples/llm/embedding_block_example.py b/examples/llm/embedding_block_example.py
index 76248ec..25bc954 100644
--- a/examples/llm/embedding_block_example.py
+++ b/examples/llm/embedding_block_example.py
@@ -13,7 +13,7 @@
 def example_openai_embeddings():
     """Example using OpenAI embeddings."""
     print("\n=== OpenAI Embeddings Example ===")
-    
+
     # Configuration for OpenAI embeddings
     config = EmbeddingConfig(
         model="text-embedding-ada-002",
@@ -21,39 +21,39 @@ def example_openai_embeddings():
         timeout=30,
         encoding_format="float",
     )
-    
+
     # Create embedding block
     embedding_block = create_embedding_block(config)
-    
+
     # Test connection
     if embedding_block.test_connection():
         print("✅ OpenAI connection successful")
     else:
         print("❌ OpenAI connection failed")
         return
-    
+
     # Generate single embedding
     text = "This is a sample text for embedding generation."
     embedding = embedding_block.generate_embedding(text)
-    
+
     if embedding:
         print(f"✅ Generated embedding with {len(embedding)} dimensions")
         print(f"   First 5 values: {embedding[:5]}")
-    
+
     # Generate multiple embeddings
     texts = [
         "First sample text for embedding.",
         "Second sample text with different content.",
-        "Third sample text for batch processing."
+        "Third sample text for batch processing.",
     ]
-    
+
     embeddings = embedding_block.generate_embeddings(texts)
-    
+
     if embeddings:
         print(f"✅ Generated {len(embeddings)} embeddings")
         for i, emb in enumerate(embeddings):
-            print(f"   Text {i+1}: {len(emb)} dimensions")
-    
+            print(f"   Text {i + 1}: {len(emb)} dimensions")
+
     # Get embedding information
     info = embedding_block.get_info()
     print(f"📊 Model info: {info['model']}")
@@ -64,7 +64,7 @@ def example_openai_embeddings():
 def example_openai_text_embedding_3():
     """Example using OpenAI text-embedding-3 with custom dimensions."""
     print("\n=== OpenAI Text-Embedding-3 Example ===")
-    
+
     # Configuration for OpenAI text-embedding-3
     config = EmbeddingConfig(
         model="text-embedding-3-small",
@@ -73,39 +73,41 @@ def example_openai_text_embedding_3():
         timeout=30,
         encoding_format="float",
     )
-    
+
     # Create embedding block
     embedding_block = create_embedding_block(config)
-    
+
     # Test connection
     if embedding_block.test_connection():
         print("✅ OpenAI text-embedding-3 connection successful")
     else:
         print("❌ OpenAI text-embedding-3 connection failed")
         return
-    
+
     # Generate single embedding
-    text = "This is a sample text for embedding generation with custom dimensions."
+    text = (
+        "This is a sample text for embedding generation with custom dimensions."
+    )
     embedding = embedding_block.generate_embedding(text)
-    
+
     if embedding:
         print(f"✅ Generated embedding with {len(embedding)} dimensions")
         print(f"   First 5 values: {embedding[:5]}")
-    
+
     # Generate multiple embeddings
     texts = [
         "First sample text for embedding.",
         "Second sample text with different content.",
-        "Third sample text for batch processing."
+        "Third sample text for batch processing.",
     ]
-    
+
     embeddings = embedding_block.generate_embeddings(texts)
-    
+
     if embeddings:
         print(f"✅ Generated {len(embeddings)} embeddings")
         for i, emb in enumerate(embeddings):
-            print(f"   Text {i+1}: {len(emb)} dimensions")
-    
+            print(f"   Text {i + 1}: {len(emb)} dimensions")
+
     # Get embedding information
     info = embedding_block.get_info()
     print(f"📊 Model info: {info['model']}")
@@ -116,7 +118,7 @@ def example_openai_text_embedding_3():
 def example_azure_embeddings():
     """Example using Azure OpenAI embeddings."""
     print("\n=== Azure OpenAI Embeddings Example ===")
-    
+
     # Configuration for Azure OpenAI embeddings
     config = EmbeddingConfig(
         model="text-embedding-ada-002",
@@ -127,42 +129,42 @@ def example_azure_embeddings():
         timeout=30,
         encoding_format="float",
     )
-    
+
     # Create embedding block
     embedding_block = create_embedding_block(config)
-    
+
     # Create embedding block
     embedding_block = create_embedding_block(config)
-    
+
     # Test connection
     if embedding_block.test_connection():
         print("✅ Azure OpenAI connection successful")
     else:
         print("❌ Azure OpenAI connection failed")
         return
-    
+
     # Generate single embedding
     text = "This is a sample text for Azure OpenAI embedding generation."
     embedding = embedding_block.generate_embedding(text)
-    
+
     if embedding:
         print(f"✅ Generated embedding with {len(embedding)} dimensions")
         print(f"   First 5 values: {embedding[:5]}")
-    
+
     # Generate multiple embeddings
     texts = [
         "First sample text for Azure embedding.",
         "Second sample text with different content.",
-        "Third sample text for batch processing."
+        "Third sample text for batch processing.",
     ]
-    
+
     embeddings = embedding_block.generate_embeddings(texts)
-    
+
     if embeddings:
         print(f"✅ Generated {len(embeddings)} embeddings")
         for i, emb in enumerate(embeddings):
-            print(f"   Text {i+1}: {len(emb)} dimensions")
-    
+            print(f"   Text {i + 1}: {len(emb)} dimensions")
+
     # Get embedding information
     info = embedding_block.get_info()
     print(f"📊 Model info: {info['model']}")
@@ -173,33 +175,28 @@ def example_azure_embeddings():
 def example_configuration_variants():
     """Example showing different configuration variants."""
     print("\n=== Configuration Variants Example ===")
-    
+
     # Base configuration
     base_config = EmbeddingConfig(
         model="text-embedding-ada-002",
         api_key=os.getenv("OPENAI_API_KEY"),
         encoding_format="float",
     )
-    
+
     # Create variants with different parameters
-    fast_config = base_config.create_variant(
-        timeout=10,
-        retry_attempts=1
-    )
-    
+    fast_config = base_config.create_variant(timeout=10, retry_attempts=1)
+
     conservative_config = base_config.create_variant(
-        timeout=120,
-        retry_attempts=5,
-        retry_delay=2.0
+        timeout=120, retry_attempts=5, retry_delay=2.0
     )
-    
+
     print(f"Base config timeout: {base_config.timeout}s")
     print(f"Fast config timeout: {fast_config.timeout}s")
     print(f"Conservative config timeout: {conservative_config.timeout}s")
-    
+
     # Test with temporary configuration
     embedding_block = create_embedding_block(base_config)
-    
+
     with embedding_block.temporary_config(timeout=5):
         print("Using temporary configuration with 5s timeout")
         # Any embedding operations here will use the temporary config
@@ -211,27 +208,27 @@ def example_configuration_variants():
 def example_error_handling():
     """Example showing error handling and fallbacks."""
     print("\n=== Error Handling Example ===")
-    
+
     # Try with invalid API key
     config = EmbeddingConfig(
         model="text-embedding-ada-002",
         api_key="invalid_key",
         timeout=5,
     )
-    
+
     embedding_block = create_embedding_block(config)
-    
+
     # This should fail gracefully
     embedding = embedding_block.generate_embedding("Test text")
     if embedding is None:
         print("✅ Gracefully handled invalid API key")
-    
+
     # Try with non-existent model
     config = EmbeddingConfig(
         model="non-existent-model",
         timeout=5,
     )
-    
+
     try:
         embedding_block = create_embedding_block(config)
         print("❌ Should have failed with non-existent model")
@@ -243,24 +240,26 @@ def main():
     """Run all embedding examples."""
     print("🚀 EmbeddingBlock Examples")
     print("=" * 50)
-    
+
     # Run examples based on available API keys
     if os.getenv("OPENAI_API_KEY"):
         example_openai_embeddings()
         example_openai_text_embedding_3()
     else:
         print("\n⚠️  Skipping OpenAI examples - OPENAI_API_KEY not set")
-    
+
     if os.getenv("AZURE_API_KEY") and os.getenv("AZURE_API_BASE"):
         example_azure_embeddings()
     else:
-        print("\n⚠️  Skipping Azure example - AZURE_API_KEY or AZURE_API_BASE not set")
-    
+        print(
+            "\n⚠️  Skipping Azure example - AZURE_API_KEY or AZURE_API_BASE not set"
+        )
+
     example_configuration_variants()
     example_error_handling()
-    
+
     print("\n✅ All examples completed!")
 
 
 if __name__ == "__main__":
-    main() 
\ No newline at end of file
+    main()
diff --git a/examples/storage/storage_performance_demo.py b/examples/storage/storage_performance_demo.py
index a991b64..8eccfd0 100644
--- a/examples/storage/storage_performance_demo.py
+++ b/examples/storage/storage_performance_demo.py
@@ -64,7 +64,7 @@ def simulate_old_behavior(storage: LocalStorage, num_lookups: int = 50):
     old_time = end_time - start_time
 
     print(f"   Time for {num_lookups} lookups: {old_time:.4f} seconds")
-    print(f"   Average per lookup: {(old_time/num_lookups)*1000:.2f} ms")
+    print(f"   Average per lookup: {(old_time / num_lookups) * 1000:.2f} ms")
 
     return old_time
 
@@ -86,7 +86,7 @@ def test_new_indexing_performance(storage: LocalStorage, num_lookups: int = 50):
     new_time = end_time - start_time
 
     print(f"   Time for {num_lookups} lookups: {new_time:.4f} seconds")
-    print(f"   Average per lookup: {(new_time/num_lookups)*1000:.2f} ms")
+    print(f"   Average per lookup: {(new_time / num_lookups) * 1000:.2f} ms")
 
     return new_time
 
@@ -110,7 +110,7 @@ def test_knowledge_lookup_performance(
     print(
         f"   Time for {num_lookups} knowledge lookups: {lookup_time:.4f} seconds"
     )
-    print(f"   Average per lookup: {(lookup_time/num_lookups)*1000:.2f} ms")
+    print(f"   Average per lookup: {(lookup_time / num_lookups) * 1000:.2f} ms")
 
     return lookup_time
 
@@ -128,7 +128,7 @@ def test_batch_operations(storage: LocalStorage):
     count = len(all_knowledges)
 
     print(f"   Retrieved {count} knowledge items in {batch_time:.4f} seconds")
-    print(f"   Average per item: {(batch_time/count)*1000:.2f} ms")
+    print(f"   Average per item: {(batch_time / count) * 1000:.2f} ms")
 
     return batch_time
 
diff --git a/quantmind/config/embedding.py b/quantmind/config/embedding.py
index e3f7587..921ab0f 100644
--- a/quantmind/config/embedding.py
+++ b/quantmind/config/embedding.py
@@ -5,7 +5,6 @@
 from pydantic import BaseModel, Field, field_validator
 
 
-
 class EmbeddingConfig(BaseModel):
     """Configuration for EmbeddingBlock."""
 
@@ -16,25 +15,32 @@ class EmbeddingConfig(BaseModel):
 
     # Optional parameters
     user: Optional[str] = Field(
-        default=None, description="A unique identifier representing your end-user"
+        default=None,
+        description="A unique identifier representing your end-user",
     )
     dimensions: Optional[int] = Field(
-        default=None, description="The number of dimensions the resulting output embeddings should have. Only supported in OpenAI/Azure text-embedding-3 and later models"
+        default=None,
+        description="The number of dimensions the resulting output embeddings should have. Only supported in OpenAI/Azure text-embedding-3 and later models",
     )
     encoding_format: str = Field(
-        default="float", description="The format to return the embeddings in. Can be either 'float' or 'base64'"
+        default="float",
+        description="The format to return the embeddings in. Can be either 'float' or 'base64'",
     )
     timeout: int = Field(
-        default=600, description="The maximum time, in seconds, to wait for the API to respond"
+        default=600,
+        description="The maximum time, in seconds, to wait for the API to respond",
     )
     api_base: Optional[str] = Field(
-        default=None, description="The api endpoint you want to call the model with"
+        default=None,
+        description="The api endpoint you want to call the model with",
     )
     api_version: Optional[str] = Field(
-        default=None, description="(Azure-specific) the api version for the call"
+        default=None,
+        description="(Azure-specific) the api version for the call",
     )
     api_key: Optional[str] = Field(
-        default=None, description="The API key to authenticate and authorize requests. If not provided, the default API key is used"
+        default=None,
+        description="The API key to authenticate and authorize requests. If not provided, the default API key is used",
     )
     api_type: Optional[str] = Field(
         default=None, description="The type of API to use"
@@ -81,22 +87,26 @@ def get_litellm_params(self) -> Dict[str, Any]:
     def get_provider_type(self) -> str:
         """Extract provider type from model name."""
         model_lower = self.model.lower()
-        
+
         # OpenAI models
-        if (model_lower.startswith("text-embedding-") or 
-            model_lower.startswith("openai/") or
-            "ada" in model_lower or "3" in model_lower):
+        if (
+            model_lower.startswith("text-embedding-")
+            or model_lower.startswith("openai/")
+            or "ada" in model_lower
+            or "3" in model_lower
+        ):
             return "openai"
-        
+
         # Azure models
         elif "azure" in model_lower:
             return "azure"
-        
+
         # Cohere models
-        elif (model_lower.startswith("embed-") or
-              model_lower.startswith("cohere/")):
+        elif model_lower.startswith("embed-") or model_lower.startswith(
+            "cohere/"
+        ):
             return "cohere"
-        
+
         # Default to openai for unknown models
         else:
             return "unknown"
diff --git a/quantmind/llm/embedding.py b/quantmind/llm/embedding.py
index 10487ff..c706091 100644
--- a/quantmind/llm/embedding.py
+++ b/quantmind/llm/embedding.py
@@ -15,291 +15,305 @@
 try:
     import litellm
     from litellm import embedding
-    
+
     LITELLM_AVAILABLE = True
 except ImportError:
     LITELLM_AVAILABLE = False
 
+
 class EmbeddingBlock:
-	"""A reusable Embedding function block using LiteLLM.
-	
-	EmbeddingBlock provides a consistent interface for generating embeddings across different providers (OpenAI, Anthropic, etc.).
-	
-	Unlike workflows, EmbeddingBlock focuses on providing basic embedding capabilities without business logic."""
-	
-	def __init__(self, config: EmbeddingConfig):
-		"""Initialize the EmbeddingBlock with configuration.
-		
-		Args:
-			config: Embedding configuration
-		
-		Raises:
-			ImportError: If LiteLLM is not available.
-		"""
-		if not LITELLM_AVAILABLE:
-			raise ImportError("litellm is required for EmbeddingBlock but not installed.")
-		
-		self.config = config
-		self._setup_litellm()
-		
-		logger.info(f"Initialized EmbeddingBlock with model: {config.model}")
-
-	def _setup_litellm(self):
-		"""Setup LiteLLM configuration."""
-		# Set global LiteLLM settings
-		litellm.set_verbose = False  # Disable verbose logging by default
-		
-		# Configure retries
-		litellm.num_retries = self.config.retry_attempts
-		litellm.request_timeout = self.config.timeout
-		
-		# Set API key as environment variable if provided
-		if self.config.api_key:
-			provider_type = self.config.get_provider_type()
-			if provider_type == "openai":
-				os.environ["OPENAI_API_KEY"] = self.config.api_key
-			elif provider_type == "azure":
-				os.environ["AZURE_API_KEY"] = self.config.api_key
-			elif provider_type == "cohere":
-				os.environ["COHERE_API_KEY"] = self.config.api_key
-		
-		logger.debug(f"Configured LiteLLM for provider: {self.config.get_provider_type()}")
-	
-	
-	def generate_embedding(self, text: str, **kwargs) -> Optional[List[float]]:
-		"""Generate embedding using the configured Embedding model.
-
-		Args:
-			text (str): The input text to embed.
-			**kwargs: Additional parameters to override config
-
-		Returns:
-			List[float]: The embedding vector as a list of floats, or None if failed.
-		"""
-		try:
-			# Get LiteLLM parameters
-			params = self.config.get_litellm_params()
-			params.update(kwargs)  # Allow runtime overrides
-			
-			# Add input text
-			params["input"] = text
-			
-			# Call LiteLLM embedding
-			response = self._call_with_retry(params)
-			
-			if response and hasattr(response, 'data'):
-				# Extract embedding from response
-				embedding_data = response.data[0] if isinstance(response.data, list) else response.data
-				return embedding_data.embedding
-			
-			return None
-			
-		except Exception as e:
-			logger.error(f"Failed to generate embedding: {e}")
-			return None
-
-	def generate_embeddings(self, texts: List[str], **kwargs) -> Optional[List[List[float]]]:
-		"""Generate embeddings for multiple texts.
-
-		Args:
-			texts (List[str]): List of input texts to embed.
-			**kwargs: Additional parameters to override config
-
-		Returns:
-			List[List[float]]: List of embedding vectors, or None if failed.
-		"""
-		try:
-			# Get LiteLLM parameters
-			params = self.config.get_litellm_params()
-			params.update(kwargs)  # Allow runtime overrides
-			
-			# Add input texts
-			params["input"] = texts
-			
-			# Call LiteLLM embedding
-			response = self._call_with_retry(params)
-			
-			if response and hasattr(response, 'data'):
-				# Extract embeddings from response
-				return [item.embedding for item in response.data]
-			
-			return None
-			
-		except Exception as e:
-			logger.error(f"Failed to generate embeddings: {e}")
-			return None
-	
-	def _call_with_retry(self, params: Dict[str, Any]) -> Optional[Any]:
-		"""Call LiteLLM embedding with retry logic.
-
-		Args:
-			params (Dict[str, Any]): The parameters to pass to the embedding function.
-
-		Returns:
-			Optional[Any]: The embedding result or None if failed.
-		"""
-		last_exception = None
-		for attempt in range(self.config.retry_attempts + 1):
-			try:
-				logger.debug(
-					f"Embedding call attempt {attempt + 1}/{self.config.retry_attempts + 1}"
-				)
-				
-				# Extract input from params and remove it for the embedding call
-				input_text = params.pop("input")
-				response = embedding(model=self.config.model, input=input_text, **params)
-
-				if hasattr(response, "usage") and response.usage:
-					logger.debug(f"Token usage: {response.usage}")
-				return response
-			except Exception as e:
-				last_exception = e
-				logger.warning(f"Embedding call attempt {attempt + 1} failed: {e}")
-
-				if attempt < self.config.retry_attempts:
-					time.sleep(self.config.retry_delay)
-				else:
-					logger.error(
-						f"All {self.config.retry_attempts + 1} attempts failed"
-					)
-		
-		# Log final error
-		if last_exception:
-			logger.error(f"Final error: {last_exception}")
-
-		return None
-
-
-	def test_connection(self) -> bool:
-		"""Test if the embedding connection is working.
+    """A reusable Embedding function block using LiteLLM.
+
+    EmbeddingBlock provides a consistent interface for generating embeddings across
+    different providers (OpenAI, Anthropic, etc.).
+
+    Unlike workflows, EmbeddingBlock focuses on providing basic embedding capabilities
+    without business logic.
+    """
+
+    def __init__(self, config: EmbeddingConfig):
+        """Initialize the EmbeddingBlock with configuration.
+
+        Args:
+                config: Embedding configuration
+
+        Raises:
+                ImportError: If LiteLLM is not available.
+        """
+        if not LITELLM_AVAILABLE:
+            raise ImportError(
+                "litellm is required for EmbeddingBlock but not installed."
+            )
+
+        self.config = config
+        self._setup_litellm()
+
+        logger.info(f"Initialized EmbeddingBlock with model: {config.model}")
+
+    def _setup_litellm(self):
+        """Setup LiteLLM configuration."""
+        # Set global LiteLLM settings
+        litellm.set_verbose = False  # Disable verbose logging by default
+
+        # Configure retries
+        litellm.num_retries = self.config.retry_attempts
+        litellm.request_timeout = self.config.timeout
+
+        # Set API key as environment variable if provided
+        if self.config.api_key:
+            provider_type = self.config.get_provider_type()
+            if provider_type == "openai":
+                os.environ["OPENAI_API_KEY"] = self.config.api_key
+            elif provider_type == "azure":
+                os.environ["AZURE_API_KEY"] = self.config.api_key
+            elif provider_type == "cohere":
+                os.environ["COHERE_API_KEY"] = self.config.api_key
+
+        logger.debug(
+            f"Configured LiteLLM for provider: {self.config.get_provider_type()}"
+        )
+
+    def generate_embedding(self, text: str, **kwargs) -> Optional[List[float]]:
+        """Generate embedding using the configured Embedding model.
+
+        Args:
+                text (str): The input text to embed.
+                **kwargs: Additional parameters to override config
+
+        Returns:
+                List[float]: The embedding vector as a list of floats, or None if failed.
+        """
+        try:
+            # Get LiteLLM parameters
+            params = self.config.get_litellm_params()
+            params.update(kwargs)  # Allow runtime overrides
+
+            # Add input text
+            params["input"] = text
+
+            # Call LiteLLM embedding
+            response = self._call_with_retry(params)
+
+            if response and hasattr(response, "data"):
+                # Extract embedding from response
+                embedding_data = (
+                    response.data[0]
+                    if isinstance(response.data, list)
+                    else response.data
+                )
+                return embedding_data.embedding
+
+            return None
+
+        except Exception as e:
+            logger.error(f"Failed to generate embedding: {e}")
+            return None
+
+    def generate_embeddings(
+        self, texts: List[str], **kwargs
+    ) -> Optional[List[List[float]]]:
+        """Generate embeddings for multiple texts.
+
+        Args:
+                texts (List[str]): List of input texts to embed.
+                **kwargs: Additional parameters to override config
+
+        Returns:
+                List[List[float]]: List of embedding vectors, or None if failed.
+        """
+        try:
+            # Get LiteLLM parameters
+            params = self.config.get_litellm_params()
+            params.update(kwargs)  # Allow runtime overrides
+
+            # Add input texts
+            params["input"] = texts
+
+            # Call LiteLLM embedding
+            response = self._call_with_retry(params)
+
+            if response and hasattr(response, "data"):
+                # Extract embeddings from response
+                return [item.embedding for item in response.data]
+
+            return None
+
+        except Exception as e:
+            logger.error(f"Failed to generate embeddings: {e}")
+            return None
+
+    def _call_with_retry(self, params: Dict[str, Any]) -> Optional[Any]:
+        """Call LiteLLM embedding with retry logic.
+
+        Args:
+                params (Dict[str, Any]): The parameters to pass to the embedding function.
+
+        Returns:
+                Optional[Any]: The embedding result or None if failed.
+        """
+        last_exception = None
+        for attempt in range(self.config.retry_attempts + 1):
+            try:
+                logger.debug(
+                    f"Embedding call attempt {attempt + 1}/{self.config.retry_attempts + 1}"
+                )
+
+                # Extract input from params and remove it for the embedding call
+                input_text = params.pop("input")
+                response = embedding(
+                    model=self.config.model, input=input_text, **params
+                )
+
+                if hasattr(response, "usage") and response.usage:
+                    logger.debug(f"Token usage: {response.usage}")
+                return response
+            except Exception as e:
+                last_exception = e
+                logger.warning(
+                    f"Embedding call attempt {attempt + 1} failed: {e}"
+                )
+
+                if attempt < self.config.retry_attempts:
+                    time.sleep(self.config.retry_delay)
+                else:
+                    logger.error(
+                        f"All {self.config.retry_attempts + 1} attempts failed"
+                    )
+
+        # Log final error
+        if last_exception:
+            logger.error(f"Final error: {last_exception}")
+
+        return None
+
+    def test_connection(self) -> bool:
+        """Test if the embedding connection is working.
 
         Returns:
             True if connection is working, False otherwise
         """
-		try:
-			response = self.generate_embedding(
-				"Hello, this is a test for embedding generation. Please respond with 'OK'."
-			)
-			return response is not None and len(response) > 0
-		except Exception as e:
-			logger.error(f"Connection test failed: {e}")
-			return False
-
-
-	def get_info(self) -> Dict[str, Any]:
-		"""Get information about the embedding block.
-
-		Returns:
-			Dictionary with embedding block information
-		"""
-		info = {
-			"model": self.config.model,
-			"provider": self.config.get_provider_type(),
-			"dimension": self.get_embedding_dimension(),
-			"config": self.config.model_dump(),
-		}
-		return info
-
-	def get_embedding_dimension(self) -> Optional[int]:
-		"""Get the dimension of embeddings generated by this model.
-
-		Returns:
-			Embedding dimension or None if not available
-		"""
-		# First check if dimensions is specified in config
-		if self.config.dimensions:
-			return self.config.dimensions
-		
-		try:
-			# Try to get dimension by generating a test embedding
-			test_embedding = self.generate_embedding("test")
-			return len(test_embedding) if test_embedding else None
-		except Exception as e:
-			logger.error(f"Failed to get embedding dimension: {e}")
-			return None
-
-	def update_config(self, **kwargs) -> None:
-		"""Update the embedding configuration.
-
-		Args:
-			**kwargs: Configuration parameters to update
-		"""
-		for key, value in kwargs.items():
-			if hasattr(self.config, key):
-				setattr(self.config, key, value)
-
-		logger.info(f"Updated embedding configuration: {kwargs}")
-
-	@contextmanager
-	def temporary_config(self, **kwargs):
-		"""Temporarily modify configuration for a context.
-
-		Args:
-			**kwargs: Temporary configuration parameters
-
-		Yields:
-			Self with temporary configuration
-		"""
-		original_config = {}
-		for key, value in kwargs.items():
-			if hasattr(self.config, key):
-				original_config[key] = getattr(self.config, key)
-				setattr(self.config, key, value)
-
-		try:
-			yield self
-		finally:
-			# Restore original configuration
-			for key, value in original_config.items():
-				setattr(self.config, key, value)
-
-	def batch_embed(
-		self, 
-		texts: List[str], 
-		batch_size: int = 32,
-		**kwargs
-	) -> Optional[List[List[float]]]:
-		"""Generate embeddings in batches for large datasets.
-
-		Args:
-			texts: List of texts to embed
-			batch_size: Number of texts to process in each batch
-			**kwargs: Additional parameters for embedding generation
-
-		Returns:
-			List of embedding vectors or None if failed
-		"""
-		try:
-			all_embeddings = []
-			
-			for i in range(0, len(texts), batch_size):
-				batch = texts[i:i + batch_size]
-				batch_embeddings = self.generate_embeddings(batch, **kwargs)
-				
-				if batch_embeddings is None:
-					logger.error(f"Failed to generate embeddings for batch {i//batch_size}")
-					return None
-				
-				all_embeddings.extend(batch_embeddings)
-				
-				# Add delay between batches if specified
-				if self.config.retry_delay > 0 and i + batch_size < len(texts):
-					time.sleep(self.config.retry_delay)
-
-			return all_embeddings
-
-		except Exception as e:
-			logger.error(f"Batch embedding failed: {e}")
-			return None
+        try:
+            response = self.generate_embedding(
+                "Hello, this is a test for embedding generation. Please respond with 'OK'."
+            )
+            return response is not None and len(response) > 0
+        except Exception as e:
+            logger.error(f"Connection test failed: {e}")
+            return False
+
+    def get_info(self) -> Dict[str, Any]:
+        """Get information about the embedding block.
+
+        Returns:
+                Dictionary with embedding block information
+        """
+        info = {
+            "model": self.config.model,
+            "provider": self.config.get_provider_type(),
+            "dimension": self.get_embedding_dimension(),
+            "config": self.config.model_dump(),
+        }
+        return info
+
+    def get_embedding_dimension(self) -> Optional[int]:
+        """Get the dimension of embeddings generated by this model.
+
+        Returns:
+                Embedding dimension or None if not available
+        """
+        # First check if dimensions is specified in config
+        if self.config.dimensions:
+            return self.config.dimensions
+
+        try:
+            # Try to get dimension by generating a test embedding
+            test_embedding = self.generate_embedding("test")
+            return len(test_embedding) if test_embedding else None
+        except Exception as e:
+            logger.error(f"Failed to get embedding dimension: {e}")
+            return None
+
+    def update_config(self, **kwargs) -> None:
+        """Update the embedding configuration.
+
+        Args:
+                **kwargs: Configuration parameters to update
+        """
+        for key, value in kwargs.items():
+            if hasattr(self.config, key):
+                setattr(self.config, key, value)
+
+        logger.info(f"Updated embedding configuration: {kwargs}")
+
+    @contextmanager
+    def temporary_config(self, **kwargs):
+        """Temporarily modify configuration for a context.
+
+        Args:
+                **kwargs: Temporary configuration parameters
+
+        Yields:
+                Self with temporary configuration
+        """
+        original_config = {}
+        for key, value in kwargs.items():
+            if hasattr(self.config, key):
+                original_config[key] = getattr(self.config, key)
+                setattr(self.config, key, value)
+
+        try:
+            yield self
+        finally:
+            # Restore original configuration
+            for key, value in original_config.items():
+                setattr(self.config, key, value)
+
+    def batch_embed(
+        self, texts: List[str], batch_size: int = 32, **kwargs
+    ) -> Optional[List[List[float]]]:
+        """Generate embeddings in batches for large datasets.
+
+        Args:
+                texts: List of texts to embed
+                batch_size: Number of texts to process in each batch
+                **kwargs: Additional parameters for embedding generation
+
+        Returns:
+                List of embedding vectors or None if failed
+        """
+        try:
+            all_embeddings = []
+
+            for i in range(0, len(texts), batch_size):
+                batch = texts[i : i + batch_size]
+                batch_embeddings = self.generate_embeddings(batch, **kwargs)
+
+                if batch_embeddings is None:
+                    logger.error(
+                        f"Failed to generate embeddings for batch {i // batch_size}"
+                    )
+                    return None
+
+                all_embeddings.extend(batch_embeddings)
+
+                # Add delay between batches if specified
+                if self.config.retry_delay > 0 and i + batch_size < len(texts):
+                    time.sleep(self.config.retry_delay)
+
+            return all_embeddings
+
+        except Exception as e:
+            logger.error(f"Batch embedding failed: {e}")
+            return None
 
 
 def create_embedding_block(config: EmbeddingConfig) -> EmbeddingBlock:
-	"""Create an EmbeddingBlock instance.
+    """Create an EmbeddingBlock instance.
 
-	Args:
-		config: Embedding configuration
+    Args:
+            config: Embedding configuration
 
-	Returns:
-		Configured EmbeddingBlock instance
-	"""
-	return EmbeddingBlock(config)
\ No newline at end of file
+    Returns:
+            Configured EmbeddingBlock instance
+    """
+    return EmbeddingBlock(config)
diff --git a/tests/llm/test_embedding.py b/tests/llm/test_embedding.py
index 88bc673..96c36f5 100644
--- a/tests/llm/test_embedding.py
+++ b/tests/llm/test_embedding.py
@@ -13,7 +13,7 @@ class TestEmbeddingConfig(unittest.TestCase):
     def test_default_config(self):
         """Test default configuration."""
         config = EmbeddingConfig()
-        
+
         self.assertEqual(config.model, "text-embedding-ada-002")
         self.assertIsNone(config.api_key)
         self.assertEqual(config.timeout, 60)
@@ -28,9 +28,9 @@ def test_custom_config(self):
             timeout=30,
             batch_size=16,
             normalize=False,
-            device="cuda"
+            device="cuda",
         )
-        
+
         self.assertEqual(config.model, "sentence-transformers/all-MiniLM-L6-v2")
         self.assertEqual(config.api_key, "test_key")
         self.assertEqual(config.timeout, 30)
@@ -43,37 +43,32 @@ def test_provider_detection(self):
         # OpenAI models
         config = EmbeddingConfig(model="text-embedding-ada-002")
         self.assertEqual(config.get_provider_type(), "openai")
-        
+
         config = EmbeddingConfig(model="text-embedding-3-small")
         self.assertEqual(config.get_provider_type(), "openai")
-        
+
         # SentenceTransformers models
         config = EmbeddingConfig(model="sentence-transformers/all-MiniLM-L6-v2")
         self.assertEqual(config.get_provider_type(), "sentence_transformers")
-        
+
         config = EmbeddingConfig(model="all-MiniLM-L6-v2")
         self.assertEqual(config.get_provider_type(), "sentence_transformers")
-        
+
         # Cohere models
         config = EmbeddingConfig(model="embed-english-v3.0")
         self.assertEqual(config.get_provider_type(), "cohere")
-        
+
         config = EmbeddingConfig(model="cohere/embed-multilingual-v3.0")
         self.assertEqual(config.get_provider_type(), "cohere")
 
     def test_create_variant(self):
         """Test creating configuration variants."""
         base_config = EmbeddingConfig(
-            model="text-embedding-ada-002",
-            timeout=60,
-            batch_size=32
-        )
-        
-        variant = base_config.create_variant(
-            timeout=30,
-            batch_size=16
+            model="text-embedding-ada-002", timeout=60, batch_size=32
         )
-        
+
+        variant = base_config.create_variant(timeout=30, batch_size=16)
+
         self.assertEqual(variant.model, "text-embedding-ada-002")
         self.assertEqual(variant.timeout, 30)
         self.assertEqual(variant.batch_size, 16)
@@ -83,10 +78,10 @@ def test_validation(self):
         # Test invalid model
         with self.assertRaises(ValueError):
             EmbeddingConfig(model="")
-        
+
         with self.assertRaises(ValueError):
             EmbeddingConfig(model=None)
-        
+
         # Test invalid API key
         with self.assertRaises(ValueError):
             EmbeddingConfig(api_key=123)
@@ -98,148 +93,149 @@ class TestEmbeddingBlock(unittest.TestCase):
     def setUp(self):
         """Set up test fixtures."""
         self.config = EmbeddingConfig(
-            model="sentence-transformers/all-MiniLM-L6-v2",
-            normalize=True
+            model="sentence-transformers/all-MiniLM-L6-v2", normalize=True
         )
 
-    @patch('quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE', True)
-    @patch('quantmind.llm.embedding.SentenceTransformer')
+    @patch("quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE", True)
+    @patch("quantmind.llm.embedding.SentenceTransformer")
     def test_initialization(self, mock_sentence_transformer):
         """Test EmbeddingBlock initialization."""
         mock_model = Mock()
         mock_sentence_transformer.return_value = mock_model
-        
+
         embedding_block = EmbeddingBlock(self.config)
-        
+
         self.assertEqual(embedding_block.config, self.config)
         mock_sentence_transformer.assert_called_once_with(self.config.model)
 
-    @patch('quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE', False)
+    @patch("quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE", False)
     def test_initialization_missing_dependency(self):
         """Test initialization with missing dependency."""
         with self.assertRaises(ImportError):
             EmbeddingBlock(self.config)
 
-    @patch('quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE', True)
-    @patch('quantmind.llm.embedding.SentenceTransformer')
+    @patch("quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE", True)
+    @patch("quantmind.llm.embedding.SentenceTransformer")
     def test_generate_embedding(self, mock_sentence_transformer):
         """Test single embedding generation."""
         mock_model = Mock()
         mock_model.encode.return_value = [0.1, 0.2, 0.3, 0.4, 0.5]
         mock_sentence_transformer.return_value = mock_model
-        
+
         embedding_block = EmbeddingBlock(self.config)
         embedding = embedding_block.generate_embedding("test text")
-        
+
         self.assertEqual(embedding, [0.1, 0.2, 0.3, 0.4, 0.5])
         mock_model.encode.assert_called_once_with("test text")
 
-    @patch('quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE', True)
-    @patch('quantmind.llm.embedding.SentenceTransformer')
+    @patch("quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE", True)
+    @patch("quantmind.llm.embedding.SentenceTransformer")
     def test_generate_embeddings(self, mock_sentence_transformer):
         """Test multiple embedding generation."""
         mock_model = Mock()
-        mock_model.encode.return_value = [
-            [0.1, 0.2, 0.3],
-            [0.4, 0.5, 0.6]
-        ]
+        mock_model.encode.return_value = [[0.1, 0.2, 0.3], [0.4, 0.5, 0.6]]
         mock_sentence_transformer.return_value = mock_model
-        
+
         embedding_block = EmbeddingBlock(self.config)
         embeddings = embedding_block.generate_embeddings(["text1", "text2"])
-        
+
         self.assertEqual(embeddings, [[0.1, 0.2, 0.3], [0.4, 0.5, 0.6]])
         mock_model.encode.assert_called_once_with(["text1", "text2"])
 
-    @patch('quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE', True)
-    @patch('quantmind.llm.embedding.SentenceTransformer')
+    @patch("quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE", True)
+    @patch("quantmind.llm.embedding.SentenceTransformer")
     def test_get_embedding_dimension(self, mock_sentence_transformer):
         """Test getting embedding dimension."""
         mock_model = Mock()
         mock_model.encode.return_value = [0.1, 0.2, 0.3, 0.4, 0.5]
         mock_sentence_transformer.return_value = mock_model
-        
+
         embedding_block = EmbeddingBlock(self.config)
         dimension = embedding_block.get_embedding_dimension()
-        
+
         self.assertEqual(dimension, 5)
 
-    @patch('quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE', True)
-    @patch('quantmind.llm.embedding.SentenceTransformer')
+    @patch("quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE", True)
+    @patch("quantmind.llm.embedding.SentenceTransformer")
     def test_test_connection(self, mock_sentence_transformer):
         """Test connection testing."""
         mock_model = Mock()
         mock_model.encode.return_value = [0.1, 0.2, 0.3]
         mock_sentence_transformer.return_value = mock_model
-        
+
         embedding_block = EmbeddingBlock(self.config)
         result = embedding_block.test_connection()
-        
+
         self.assertTrue(result)
 
-    @patch('quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE', True)
-    @patch('quantmind.llm.embedding.SentenceTransformer')
+    @patch("quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE", True)
+    @patch("quantmind.llm.embedding.SentenceTransformer")
     def test_get_info(self, mock_sentence_transformer):
         """Test getting embedding block information."""
         mock_model = Mock()
         mock_model.encode.return_value = [0.1, 0.2, 0.3]
         mock_sentence_transformer.return_value = mock_model
-        
+
         embedding_block = EmbeddingBlock(self.config)
         info = embedding_block.get_info()
-        
+
         self.assertEqual(info["model"], self.config.model)
         self.assertEqual(info["provider"], "sentence_transformers")
         self.assertEqual(info["dimension"], 3)
         self.assertIn("config", info)
 
-    @patch('quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE', True)
-    @patch('quantmind.llm.embedding.SentenceTransformer')
+    @patch("quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE", True)
+    @patch("quantmind.llm.embedding.SentenceTransformer")
     def test_update_config(self, mock_sentence_transformer):
         """Test configuration updates."""
         mock_model = Mock()
         mock_sentence_transformer.return_value = mock_model
-        
+
         embedding_block = EmbeddingBlock(self.config)
-        
+
         # Update timeout
         embedding_block.update_config(timeout=30)
         self.assertEqual(embedding_block.config.timeout, 30)
-        
+
         # Update model (should reinitialize)
-        embedding_block.update_config(model="sentence-transformers/all-mpnet-base-v2")
-        self.assertEqual(embedding_block.config.model, "sentence-transformers/all-mpnet-base-v2")
+        embedding_block.update_config(
+            model="sentence-transformers/all-mpnet-base-v2"
+        )
+        self.assertEqual(
+            embedding_block.config.model,
+            "sentence-transformers/all-mpnet-base-v2",
+        )
 
-    @patch('quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE', True)
-    @patch('quantmind.llm.embedding.SentenceTransformer')
+    @patch("quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE", True)
+    @patch("quantmind.llm.embedding.SentenceTransformer")
     def test_temporary_config(self, mock_sentence_transformer):
         """Test temporary configuration context manager."""
         mock_model = Mock()
         mock_model.encode.return_value = [0.1, 0.2, 0.3]
         mock_sentence_transformer.return_value = mock_model
-        
+
         embedding_block = EmbeddingBlock(self.config)
         original_timeout = embedding_block.config.timeout
-        
+
         with embedding_block.temporary_config(timeout=10):
             self.assertEqual(embedding_block.config.timeout, 10)
-        
+
         # Should be restored
         self.assertEqual(embedding_block.config.timeout, original_timeout)
 
-    @patch('quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE', True)
-    @patch('quantmind.llm.embedding.SentenceTransformer')
+    @patch("quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE", True)
+    @patch("quantmind.llm.embedding.SentenceTransformer")
     def test_batch_embed(self, mock_sentence_transformer):
         """Test batch embedding processing."""
         mock_model = Mock()
         mock_model.encode.return_value = [[0.1, 0.2], [0.3, 0.4]]
         mock_sentence_transformer.return_value = mock_model
-        
+
         embedding_block = EmbeddingBlock(self.config)
         texts = ["text1", "text2", "text3", "text4"]
-        
+
         embeddings = embedding_block.batch_embed(texts, batch_size=2)
-        
+
         self.assertEqual(len(embeddings), 4)
         # Should have been called twice (2 batches of 2)
         self.assertEqual(mock_model.encode.call_count, 2)
@@ -250,17 +246,17 @@ class TestCreateEmbeddingBlock(unittest.TestCase):
 
     def test_create_embedding_block(self):
         """Test creating embedding block."""
-        config = EmbeddingConfig(
-            model="sentence-transformers/all-MiniLM-L6-v2"
-        )
-        
-        with patch('quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE', True):
-            with patch('quantmind.llm.embedding.SentenceTransformer'):
+        config = EmbeddingConfig(model="sentence-transformers/all-MiniLM-L6-v2")
+
+        with patch(
+            "quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE", True
+        ):
+            with patch("quantmind.llm.embedding.SentenceTransformer"):
                 embedding_block = create_embedding_block(config)
-                
+
                 self.assertIsInstance(embedding_block, EmbeddingBlock)
                 self.assertEqual(embedding_block.config, config)
 
 
 if __name__ == "__main__":
-    unittest.main()
\ No newline at end of file
+    unittest.main()

From 2ab637ae8b8fef824fcadd417c65e03dfda8be40 Mon Sep 17 00:00:00 2001
From: bridgeqiqi <Bridgeqiqi@163.com>
Date: Fri, 1 Aug 2025 00:51:47 +0800
Subject: [PATCH 05/17] remove some unittest

---
 tests/llm/test_embedding.py | 241 +-----------------------------------
 1 file changed, 1 insertion(+), 240 deletions(-)

diff --git a/tests/llm/test_embedding.py b/tests/llm/test_embedding.py
index 96c36f5..7ec49d4 100644
--- a/tests/llm/test_embedding.py
+++ b/tests/llm/test_embedding.py
@@ -16,246 +16,7 @@ def test_default_config(self):
 
         self.assertEqual(config.model, "text-embedding-ada-002")
         self.assertIsNone(config.api_key)
-        self.assertEqual(config.timeout, 60)
-        self.assertEqual(config.batch_size, 32)
-        self.assertTrue(config.normalize)
-
-    def test_custom_config(self):
-        """Test custom configuration."""
-        config = EmbeddingConfig(
-            model="sentence-transformers/all-MiniLM-L6-v2",
-            api_key="test_key",
-            timeout=30,
-            batch_size=16,
-            normalize=False,
-            device="cuda",
-        )
-
-        self.assertEqual(config.model, "sentence-transformers/all-MiniLM-L6-v2")
-        self.assertEqual(config.api_key, "test_key")
-        self.assertEqual(config.timeout, 30)
-        self.assertEqual(config.batch_size, 16)
-        self.assertFalse(config.normalize)
-        self.assertEqual(config.device, "cuda")
-
-    def test_provider_detection(self):
-        """Test provider type detection."""
-        # OpenAI models
-        config = EmbeddingConfig(model="text-embedding-ada-002")
-        self.assertEqual(config.get_provider_type(), "openai")
-
-        config = EmbeddingConfig(model="text-embedding-3-small")
-        self.assertEqual(config.get_provider_type(), "openai")
-
-        # SentenceTransformers models
-        config = EmbeddingConfig(model="sentence-transformers/all-MiniLM-L6-v2")
-        self.assertEqual(config.get_provider_type(), "sentence_transformers")
-
-        config = EmbeddingConfig(model="all-MiniLM-L6-v2")
-        self.assertEqual(config.get_provider_type(), "sentence_transformers")
-
-        # Cohere models
-        config = EmbeddingConfig(model="embed-english-v3.0")
-        self.assertEqual(config.get_provider_type(), "cohere")
-
-        config = EmbeddingConfig(model="cohere/embed-multilingual-v3.0")
-        self.assertEqual(config.get_provider_type(), "cohere")
-
-    def test_create_variant(self):
-        """Test creating configuration variants."""
-        base_config = EmbeddingConfig(
-            model="text-embedding-ada-002", timeout=60, batch_size=32
-        )
-
-        variant = base_config.create_variant(timeout=30, batch_size=16)
-
-        self.assertEqual(variant.model, "text-embedding-ada-002")
-        self.assertEqual(variant.timeout, 30)
-        self.assertEqual(variant.batch_size, 16)
-
-    def test_validation(self):
-        """Test configuration validation."""
-        # Test invalid model
-        with self.assertRaises(ValueError):
-            EmbeddingConfig(model="")
-
-        with self.assertRaises(ValueError):
-            EmbeddingConfig(model=None)
-
-        # Test invalid API key
-        with self.assertRaises(ValueError):
-            EmbeddingConfig(api_key=123)
-
-
-class TestEmbeddingBlock(unittest.TestCase):
-    """Test EmbeddingBlock class."""
-
-    def setUp(self):
-        """Set up test fixtures."""
-        self.config = EmbeddingConfig(
-            model="sentence-transformers/all-MiniLM-L6-v2", normalize=True
-        )
-
-    @patch("quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE", True)
-    @patch("quantmind.llm.embedding.SentenceTransformer")
-    def test_initialization(self, mock_sentence_transformer):
-        """Test EmbeddingBlock initialization."""
-        mock_model = Mock()
-        mock_sentence_transformer.return_value = mock_model
-
-        embedding_block = EmbeddingBlock(self.config)
-
-        self.assertEqual(embedding_block.config, self.config)
-        mock_sentence_transformer.assert_called_once_with(self.config.model)
-
-    @patch("quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE", False)
-    def test_initialization_missing_dependency(self):
-        """Test initialization with missing dependency."""
-        with self.assertRaises(ImportError):
-            EmbeddingBlock(self.config)
-
-    @patch("quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE", True)
-    @patch("quantmind.llm.embedding.SentenceTransformer")
-    def test_generate_embedding(self, mock_sentence_transformer):
-        """Test single embedding generation."""
-        mock_model = Mock()
-        mock_model.encode.return_value = [0.1, 0.2, 0.3, 0.4, 0.5]
-        mock_sentence_transformer.return_value = mock_model
-
-        embedding_block = EmbeddingBlock(self.config)
-        embedding = embedding_block.generate_embedding("test text")
-
-        self.assertEqual(embedding, [0.1, 0.2, 0.3, 0.4, 0.5])
-        mock_model.encode.assert_called_once_with("test text")
-
-    @patch("quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE", True)
-    @patch("quantmind.llm.embedding.SentenceTransformer")
-    def test_generate_embeddings(self, mock_sentence_transformer):
-        """Test multiple embedding generation."""
-        mock_model = Mock()
-        mock_model.encode.return_value = [[0.1, 0.2, 0.3], [0.4, 0.5, 0.6]]
-        mock_sentence_transformer.return_value = mock_model
-
-        embedding_block = EmbeddingBlock(self.config)
-        embeddings = embedding_block.generate_embeddings(["text1", "text2"])
-
-        self.assertEqual(embeddings, [[0.1, 0.2, 0.3], [0.4, 0.5, 0.6]])
-        mock_model.encode.assert_called_once_with(["text1", "text2"])
-
-    @patch("quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE", True)
-    @patch("quantmind.llm.embedding.SentenceTransformer")
-    def test_get_embedding_dimension(self, mock_sentence_transformer):
-        """Test getting embedding dimension."""
-        mock_model = Mock()
-        mock_model.encode.return_value = [0.1, 0.2, 0.3, 0.4, 0.5]
-        mock_sentence_transformer.return_value = mock_model
-
-        embedding_block = EmbeddingBlock(self.config)
-        dimension = embedding_block.get_embedding_dimension()
-
-        self.assertEqual(dimension, 5)
-
-    @patch("quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE", True)
-    @patch("quantmind.llm.embedding.SentenceTransformer")
-    def test_test_connection(self, mock_sentence_transformer):
-        """Test connection testing."""
-        mock_model = Mock()
-        mock_model.encode.return_value = [0.1, 0.2, 0.3]
-        mock_sentence_transformer.return_value = mock_model
-
-        embedding_block = EmbeddingBlock(self.config)
-        result = embedding_block.test_connection()
-
-        self.assertTrue(result)
-
-    @patch("quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE", True)
-    @patch("quantmind.llm.embedding.SentenceTransformer")
-    def test_get_info(self, mock_sentence_transformer):
-        """Test getting embedding block information."""
-        mock_model = Mock()
-        mock_model.encode.return_value = [0.1, 0.2, 0.3]
-        mock_sentence_transformer.return_value = mock_model
-
-        embedding_block = EmbeddingBlock(self.config)
-        info = embedding_block.get_info()
-
-        self.assertEqual(info["model"], self.config.model)
-        self.assertEqual(info["provider"], "sentence_transformers")
-        self.assertEqual(info["dimension"], 3)
-        self.assertIn("config", info)
-
-    @patch("quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE", True)
-    @patch("quantmind.llm.embedding.SentenceTransformer")
-    def test_update_config(self, mock_sentence_transformer):
-        """Test configuration updates."""
-        mock_model = Mock()
-        mock_sentence_transformer.return_value = mock_model
-
-        embedding_block = EmbeddingBlock(self.config)
-
-        # Update timeout
-        embedding_block.update_config(timeout=30)
-        self.assertEqual(embedding_block.config.timeout, 30)
-
-        # Update model (should reinitialize)
-        embedding_block.update_config(
-            model="sentence-transformers/all-mpnet-base-v2"
-        )
-        self.assertEqual(
-            embedding_block.config.model,
-            "sentence-transformers/all-mpnet-base-v2",
-        )
-
-    @patch("quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE", True)
-    @patch("quantmind.llm.embedding.SentenceTransformer")
-    def test_temporary_config(self, mock_sentence_transformer):
-        """Test temporary configuration context manager."""
-        mock_model = Mock()
-        mock_model.encode.return_value = [0.1, 0.2, 0.3]
-        mock_sentence_transformer.return_value = mock_model
-
-        embedding_block = EmbeddingBlock(self.config)
-        original_timeout = embedding_block.config.timeout
-
-        with embedding_block.temporary_config(timeout=10):
-            self.assertEqual(embedding_block.config.timeout, 10)
-
-        # Should be restored
-        self.assertEqual(embedding_block.config.timeout, original_timeout)
-
-    @patch("quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE", True)
-    @patch("quantmind.llm.embedding.SentenceTransformer")
-    def test_batch_embed(self, mock_sentence_transformer):
-        """Test batch embedding processing."""
-        mock_model = Mock()
-        mock_model.encode.return_value = [[0.1, 0.2], [0.3, 0.4]]
-        mock_sentence_transformer.return_value = mock_model
-
-        embedding_block = EmbeddingBlock(self.config)
-        texts = ["text1", "text2", "text3", "text4"]
-
-        embeddings = embedding_block.batch_embed(texts, batch_size=2)
-
-        self.assertEqual(len(embeddings), 4)
-        # Should have been called twice (2 batches of 2)
-        self.assertEqual(mock_model.encode.call_count, 2)
-
-
-class TestCreateEmbeddingBlock(unittest.TestCase):
-    """Test create_embedding_block function."""
-
-    def test_create_embedding_block(self):
-        """Test creating embedding block."""
-        config = EmbeddingConfig(model="sentence-transformers/all-MiniLM-L6-v2")
-
-        with patch(
-            "quantmind.llm.embedding.SENTENCE_TRANSFORMERS_AVAILABLE", True
-        ):
-            with patch("quantmind.llm.embedding.SentenceTransformer"):
-                embedding_block = create_embedding_block(config)
-
-                self.assertIsInstance(embedding_block, EmbeddingBlock)
-                self.assertEqual(embedding_block.config, config)
+        self.assertEqual(config.timeout, 600)
 
 
 if __name__ == "__main__":

From b70109c173534b414a781c2d7d72637cf90297ca Mon Sep 17 00:00:00 2001
From: bridgeqiqi <Bridgeqiqi@163.com>
Date: Sat, 2 Aug 2025 02:53:05 +0800
Subject: [PATCH 06/17] feat(embedding): update unittest

---
 quantmind/config/embedding.py                 |  37 +-
 quantmind/llm/embedding.py                    |  21 +-
 tests/config/test_embedding.py                | 315 +++++++++++++
 tests/llm/test_embedding.py                   |  23 -
 tests/llm/test_embedding_block.py             | 438 ++++++++++++++++++
 .../llm/{test_block.py => test_llm_block.py}  |   0
 6 files changed, 790 insertions(+), 44 deletions(-)
 create mode 100644 tests/config/test_embedding.py
 delete mode 100644 tests/llm/test_embedding.py
 create mode 100644 tests/llm/test_embedding_block.py
 rename tests/llm/{test_block.py => test_llm_block.py} (100%)

diff --git a/quantmind/config/embedding.py b/quantmind/config/embedding.py
index 921ab0f..72efec4 100644
--- a/quantmind/config/embedding.py
+++ b/quantmind/config/embedding.py
@@ -1,7 +1,9 @@
 """Embedding configuration for QuantMind."""
 
+from random import choices
 from typing import Any, Dict, Optional
 
+from litellm import retry
 from pydantic import BaseModel, Field, field_validator
 
 
@@ -30,6 +32,16 @@ class EmbeddingConfig(BaseModel):
         default=600,
         description="The maximum time, in seconds, to wait for the API to respond",
     )
+    retry_attempts: int = Field(
+        default=3,
+        ge=0,
+        description="The number of retry attempts",
+    )
+    retry_delay: float = Field(
+        default=1.0,
+        ge=0,
+        description="The delay between retries in seconds",
+    )
     api_base: Optional[str] = Field(
         default=None,
         description="The api endpoint you want to call the model with",
@@ -53,19 +65,17 @@ def validate_model(cls, v):
             raise ValueError("Model name must be a non-empty string")
         return v.strip()
 
-    @field_validator("encoding_format")
-    def validate_encoding_format(cls, v):
-        """Validate encoding format."""
-        if v not in ["float", "base64"]:
-            raise ValueError("encoding_format must be 'float' or 'base64'")
+    @field_validator("api_key")
+    def validate_api_key(cls, v):
+        """Validate API key."""
+        if v is not None and not isinstance(v, str):
+            raise ValueError("API key must be a string")
         return v
 
     def get_litellm_params(self) -> Dict[str, Any]:
         """Get parameters formatted for LiteLLM embedding."""
         params = {
             "model": self.model,
-            "encoding_format": self.encoding_format,
-            "timeout": self.timeout,
         }
 
         # Add optional parameters if provided
@@ -73,6 +83,8 @@ def get_litellm_params(self) -> Dict[str, Any]:
             params["user"] = self.user
         if self.dimensions:
             params["dimensions"] = self.dimensions
+        if self.encoding_format:
+            params["encoding_format"] = self.encoding_format
         if self.api_base:
             params["api_base"] = self.api_base
         if self.api_version:
@@ -89,12 +101,11 @@ def get_provider_type(self) -> str:
         model_lower = self.model.lower()
 
         # OpenAI models
-        if (
-            model_lower.startswith("text-embedding-")
-            or model_lower.startswith("openai/")
-            or "ada" in model_lower
-            or "3" in model_lower
-        ):
+        if model_lower in [
+            "text-embedding-ada-002",
+            "text-embedding-3-small",
+            "text-embedding-3-large",
+        ]:
             return "openai"
 
         # Azure models
diff --git a/quantmind/llm/embedding.py b/quantmind/llm/embedding.py
index c706091..a1ecbc2 100644
--- a/quantmind/llm/embedding.py
+++ b/quantmind/llm/embedding.py
@@ -158,10 +158,17 @@ def _call_with_retry(self, params: Dict[str, Any]) -> Optional[Any]:
                     f"Embedding call attempt {attempt + 1}/{self.config.retry_attempts + 1}"
                 )
 
-                # Extract input from params and remove it for the embedding call
-                input_text = params.pop("input")
+                # Create a copy of params to avoid mutation
+                call_params = params.copy()
+
+                # Extract input from params
+                input_text = call_params.pop("input")
+
+                # Remove model from params if it exists to avoid duplication
+                call_params.pop("model", None)
+
                 response = embedding(
-                    model=self.config.model, input=input_text, **params
+                    model=self.config.model, input=input_text, **call_params
                 )
 
                 if hasattr(response, "usage") and response.usage:
@@ -193,9 +200,7 @@ def test_connection(self) -> bool:
             True if connection is working, False otherwise
         """
         try:
-            response = self.generate_embedding(
-                "Hello, this is a test for embedding generation. Please respond with 'OK'."
-            )
+            response = self.generate_embedding("test")
             return response is not None and len(response) > 0
         except Exception as e:
             logger.error(f"Connection test failed: {e}")
@@ -210,8 +215,8 @@ def get_info(self) -> Dict[str, Any]:
         info = {
             "model": self.config.model,
             "provider": self.config.get_provider_type(),
-            "dimension": self.get_embedding_dimension(),
-            "config": self.config.model_dump(),
+            "timeout": self.config.timeout,
+            "retry_attempts": self.config.retry_attempts,
         }
         return info
 
diff --git a/tests/config/test_embedding.py b/tests/config/test_embedding.py
new file mode 100644
index 0000000..8c75108
--- /dev/null
+++ b/tests/config/test_embedding.py
@@ -0,0 +1,315 @@
+"""Tests for Embedding configuration."""
+
+import unittest
+from unittest.mock import patch
+
+from quantmind.config.embedding import EmbeddingConfig
+
+
+class TestEmbeddingConfig(unittest.TestCase):
+    """Test cases for EmbeddingConfig."""
+
+    def test_default_config(self):
+        """Test default configuration values."""
+        config = EmbeddingConfig()
+
+        # Test default values
+        self.assertEqual(config.model, "text-embedding-ada-002")
+        self.assertIsNone(config.user)
+        self.assertIsNone(config.dimensions)
+        self.assertEqual(config.encoding_format, "float")
+        self.assertEqual(config.timeout, 600)
+        self.assertIsNone(config.api_base)
+        self.assertIsNone(config.api_version)
+        self.assertIsNone(config.api_key)
+        self.assertIsNone(config.api_type)
+
+    def test_custom_config(self):
+        """Test custom configuration values."""
+        config = EmbeddingConfig(
+            model="text-embedding-3-small",
+            user="test_user_123",
+            dimensions=512,
+            encoding_format="base64",
+            timeout=30,
+            api_key="test-key",
+            api_base="https://api.example.com",
+            api_version="2023-05-15",
+            api_type="azure",
+        )
+
+        self.assertEqual(config.model, "text-embedding-3-small")
+        self.assertEqual(config.user, "test_user_123")
+        self.assertEqual(config.dimensions, 512)
+        self.assertEqual(config.encoding_format, "base64")
+        self.assertEqual(config.timeout, 30)
+        self.assertEqual(config.api_key, "test-key")
+        self.assertEqual(config.api_base, "https://api.example.com")
+        self.assertEqual(config.api_version, "2023-05-15")
+        self.assertEqual(config.api_type, "azure")
+
+    def test_validation_model(self):
+        """Test model validation."""
+        # Valid model
+        config = EmbeddingConfig(model="text-embedding-ada-002")
+        self.assertEqual(config.model, "text-embedding-ada-002")
+
+        # Empty model should raise error
+        with self.assertRaises(ValueError):
+            EmbeddingConfig(model="")
+
+        # None model should raise error
+        with self.assertRaises(ValueError):
+            EmbeddingConfig(model=None)
+
+        # Whitespace should be stripped
+        config = EmbeddingConfig(model="  text-embedding-ada-002  ")
+        self.assertEqual(config.model, "text-embedding-ada-002")
+
+    def test_validation_api_key(self):
+        """Test API key validation."""
+        # Valid API key
+        config = EmbeddingConfig(api_key="test-key")
+        self.assertEqual(config.api_key, "test-key")
+
+        # None API key is valid
+        config = EmbeddingConfig(api_key=None)
+        self.assertIsNone(config.api_key)
+
+        # Invalid API key type should raise error
+        with self.assertRaises(ValueError):
+            EmbeddingConfig(api_key=123)
+
+        with self.assertRaises(ValueError):
+            EmbeddingConfig(api_key=[])
+
+    def test_get_provider_type(self):
+        """Test provider type detection."""
+        # OpenAI models
+        config = EmbeddingConfig(model="text-embedding-ada-002")
+        self.assertEqual(config.get_provider_type(), "openai")
+
+        config = EmbeddingConfig(model="text-embedding-3-small")
+        self.assertEqual(config.get_provider_type(), "openai")
+
+        config = EmbeddingConfig(model="text-embedding-3-large")
+        self.assertEqual(config.get_provider_type(), "openai")
+
+        # Azure models
+        config = EmbeddingConfig(model="azure/text-embedding-ada-002")
+        self.assertEqual(config.get_provider_type(), "azure")
+
+        config = EmbeddingConfig(model="text-embedding-ada-002-azure")
+        self.assertEqual(config.get_provider_type(), "azure")
+
+        # Cohere models
+        config = EmbeddingConfig(model="embed-english-v3.0")
+        self.assertEqual(config.get_provider_type(), "cohere")
+
+        config = EmbeddingConfig(model="cohere/embed-multilingual-v3.0")
+        self.assertEqual(config.get_provider_type(), "cohere")
+
+        # Unknown models
+        config = EmbeddingConfig(model="unknown-model")
+        self.assertEqual(config.get_provider_type(), "unknown")
+
+    def test_get_litellm_params_minimal(self):
+        """Test get_litellm_params with minimal configuration."""
+        config = EmbeddingConfig(model="text-embedding-ada-002")
+        params = config.get_litellm_params()
+
+        self.assertEqual(params["model"], "text-embedding-ada-002")
+        self.assertIn("encoding_format", params)
+        self.assertEqual(len(params), 2)  # Only model and encoding_format
+
+    def test_get_litellm_params_full(self):
+        """Test get_litellm_params with full configuration."""
+        config = EmbeddingConfig(
+            model="text-embedding-3-small",
+            user="test_user",
+            dimensions=512,
+            encoding_format="base64",
+            timeout=30,
+            api_key="test-key",
+            api_base="https://api.example.com",
+            api_version="2023-05-15",
+            api_type="azure",
+        )
+        params = config.get_litellm_params()
+
+        expected_params = {
+            "model": "text-embedding-3-small",
+            "user": "test_user",
+            "dimensions": 512,
+            "encoding_format": "base64",
+            "api_base": "https://api.example.com",
+            "api_version": "2023-05-15",
+            "api_key": "test-key",
+            "api_type": "azure",
+        }
+
+        self.assertEqual(params, expected_params)
+
+    def test_get_litellm_params_partial(self):
+        """Test get_litellm_params with partial configuration."""
+        config = EmbeddingConfig(
+            model="text-embedding-ada-002",
+            user="test_user",
+            dimensions=1536,
+            api_key="test-key",
+        )
+        params = config.get_litellm_params()
+
+        expected_params = {
+            "model": "text-embedding-ada-002",
+            "user": "test_user",
+            "dimensions": 1536,
+            "encoding_format": "float",
+            "api_key": "test-key",
+        }
+
+        self.assertEqual(params, expected_params)
+
+    def test_create_variant(self):
+        """Test creating configuration variants."""
+        base_config = EmbeddingConfig(
+            model="text-embedding-ada-002",
+            timeout=60,
+            api_key="base-key",
+        )
+
+        # Create variant with overrides
+        variant = base_config.create_variant(
+            timeout=30,
+            api_key="variant-key",
+            user="test_user",
+        )
+
+        # Original config should be unchanged
+        self.assertEqual(base_config.timeout, 60)
+        self.assertEqual(base_config.api_key, "base-key")
+        self.assertIsNone(base_config.user)
+
+        # Variant should have new values
+        self.assertEqual(variant.timeout, 30)
+        self.assertEqual(variant.api_key, "variant-key")
+        self.assertEqual(variant.user, "test_user")
+        self.assertEqual(variant.model, "text-embedding-ada-002")  # Unchanged
+
+    def test_create_variant_empty(self):
+        """Test creating variant with no overrides."""
+        base_config = EmbeddingConfig(
+            model="text-embedding-ada-002",
+            timeout=60,
+        )
+
+        variant = base_config.create_variant()
+
+        # Should be identical to base config
+        self.assertEqual(variant.model, base_config.model)
+        self.assertEqual(variant.timeout, base_config.timeout)
+        self.assertEqual(variant.encoding_format, base_config.encoding_format)
+
+    def test_encoding_format_validation(self):
+        """Test encoding format validation."""
+        # Valid encoding formats
+        config = EmbeddingConfig(encoding_format="float")
+        self.assertEqual(config.encoding_format, "float")
+
+        config = EmbeddingConfig(encoding_format="base64")
+        self.assertEqual(config.encoding_format, "base64")
+
+    def test_dimensions_validation(self):
+        """Test dimensions validation."""
+        # Valid dimensions
+        config = EmbeddingConfig(dimensions=512)
+        self.assertEqual(config.dimensions, 512)
+
+        config = EmbeddingConfig(dimensions=1536)
+        self.assertEqual(config.dimensions, 1536)
+
+        config = EmbeddingConfig(dimensions=3072)
+        self.assertEqual(config.dimensions, 3072)
+
+        # None is valid
+        config = EmbeddingConfig(dimensions=None)
+        self.assertIsNone(config.dimensions)
+
+        # Zero and negative dimensions should be allowed (validation handled by API)
+        config = EmbeddingConfig(dimensions=0)
+        self.assertEqual(config.dimensions, 0)
+
+        config = EmbeddingConfig(dimensions=-1)
+        self.assertEqual(config.dimensions, -1)
+
+    def test_timeout_validation(self):
+        """Test timeout validation."""
+        # Valid timeouts
+        config = EmbeddingConfig(timeout=1)
+        self.assertEqual(config.timeout, 1)
+
+        config = EmbeddingConfig(timeout=600)
+        self.assertEqual(config.timeout, 600)
+
+        config = EmbeddingConfig(timeout=3600)
+        self.assertEqual(config.timeout, 3600)
+
+        # Zero and negative timeouts should be allowed (validation handled by API)
+        config = EmbeddingConfig(timeout=0)
+        self.assertEqual(config.timeout, 0)
+
+        config = EmbeddingConfig(timeout=-1)
+        self.assertEqual(config.timeout, -1)
+
+    def test_equality(self):
+        """Test config equality."""
+        config1 = EmbeddingConfig(
+            model="text-embedding-ada-002",
+            user="test_user",
+            dimensions=512,
+        )
+
+        config2 = EmbeddingConfig(
+            model="text-embedding-ada-002",
+            user="test_user",
+            dimensions=512,
+        )
+
+        config3 = EmbeddingConfig(
+            model="text-embedding-3-small",
+            user="test_user",
+            dimensions=512,
+        )
+
+        self.assertEqual(config1, config2)
+        self.assertNotEqual(config1, config3)
+
+    def test_repr(self):
+        """Test config string representation."""
+        config = EmbeddingConfig(
+            model="text-embedding-ada-002",
+            user="test_user",
+            dimensions=512,
+        )
+
+        repr_str = repr(config)
+        self.assertIn("text-embedding-ada-002", repr_str)
+        self.assertIn("test_user", repr_str)
+        self.assertIn("512", repr_str)
+
+    def test_str(self):
+        """Test config string representation."""
+        config = EmbeddingConfig(
+            model="text-embedding-ada-002",
+            user="test_user",
+            dimensions=512,
+        )
+
+        str_repr = str(config)
+        self.assertIn("text-embedding-ada-002", str_repr)
+        self.assertIn("test_user", str_repr)
+        self.assertIn("512", str_repr)
+
+
+if __name__ == "__main__":
+    unittest.main()
diff --git a/tests/llm/test_embedding.py b/tests/llm/test_embedding.py
deleted file mode 100644
index 7ec49d4..0000000
--- a/tests/llm/test_embedding.py
+++ /dev/null
@@ -1,23 +0,0 @@
-"""Tests for EmbeddingBlock."""
-
-import unittest
-from unittest.mock import Mock, patch
-
-from quantmind.config import EmbeddingConfig
-from quantmind.llm import EmbeddingBlock, create_embedding_block
-
-
-class TestEmbeddingConfig(unittest.TestCase):
-    """Test EmbeddingConfig class."""
-
-    def test_default_config(self):
-        """Test default configuration."""
-        config = EmbeddingConfig()
-
-        self.assertEqual(config.model, "text-embedding-ada-002")
-        self.assertIsNone(config.api_key)
-        self.assertEqual(config.timeout, 600)
-
-
-if __name__ == "__main__":
-    unittest.main()
diff --git a/tests/llm/test_embedding_block.py b/tests/llm/test_embedding_block.py
new file mode 100644
index 0000000..4b24cac
--- /dev/null
+++ b/tests/llm/test_embedding_block.py
@@ -0,0 +1,438 @@
+"""Tests for EmbeddingBlock."""
+
+import unittest
+from unittest import mock
+from unittest.mock import Mock, patch
+
+from quantmind.config import EmbeddingConfig
+from quantmind.llm import EmbeddingBlock, create_embedding_block
+
+
+class TestEmbeddingBlock(unittest.TestCase):
+    """Test cases for EmbeddingBlock."""
+
+    def setUp(self):
+        """Set up test fixtures."""
+        self.config = EmbeddingConfig(
+            model="text-embedding-ada-002",
+            api_key="test-key",
+            timeout=30,
+        )
+
+    @patch("quantmind.llm.embedding.LITELLM_AVAILABLE", True)
+    @patch("quantmind.llm.embedding.litellm")
+    def test_init_success(self, mock_litellm):
+        """Test successful initialization."""
+        block = EmbeddingBlock(self.config)
+
+        self.assertEqual(block.config, self.config)
+        mock_litellm.set_verbose = False
+        self.assertEqual(mock_litellm.num_retries, 3)
+        self.assertEqual(mock_litellm.request_timeout, 30)
+
+    @patch("quantmind.llm.embedding.LITELLM_AVAILABLE", False)
+    def test_init_litellm_unavailable(self):
+        """Test initialization when LiteLLM is not available."""
+        with self.assertRaises(ImportError) as context:
+            EmbeddingBlock(self.config)
+
+        self.assertIn(
+            "litellm is required for EmbeddingBlock", str(context.exception)
+        )
+
+    @patch("quantmind.llm.embedding.LITELLM_AVAILABLE", True)
+    @patch("quantmind.llm.embedding.litellm")
+    @patch("os.environ", {})
+    def test_setup_litellm_openai(self, mock_litellm):
+        """Test LiteLLM setup for OpenAI."""
+        config = EmbeddingConfig(
+            model="text-embedding-ada-002", api_key="test-key"
+        )
+
+        with patch("os.environ", {}) as mock_env:
+            block = EmbeddingBlock(config)
+            self.assertEqual(mock_env.get("OPENAI_API_KEY"), "test-key")
+
+    @patch("quantmind.llm.embedding.LITELLM_AVAILABLE", True)
+    @patch("quantmind.llm.embedding.litellm")
+    @patch("os.environ", {})
+    def test_setup_litellm_azure(self, mock_litellm):
+        """Test LiteLLM setup for Azure."""
+        config = EmbeddingConfig(
+            model="azure/text-embedding-ada-002", api_key="azure-key"
+        )
+
+        with patch("os.environ", {}) as mock_env:
+            block = EmbeddingBlock(config)
+            self.assertEqual(mock_env.get("AZURE_API_KEY"), "azure-key")
+
+    @patch("quantmind.llm.embedding.LITELLM_AVAILABLE", True)
+    @patch("quantmind.llm.embedding.litellm")
+    @patch("quantmind.llm.embedding.embedding")
+    def test_generate_embedding_success(self, mock_embedding, mock_litellm):
+        """Test successful single embedding generation."""
+        # Mock response
+        mock_response = Mock()
+        mock_response.data = [Mock()]
+        mock_response.data[0].embedding = [0.1, 0.2, 0.3, 0.4, 0.5]
+        mock_embedding.return_value = mock_response
+
+        block = EmbeddingBlock(self.config)
+        result = block.generate_embedding("Test text")
+
+        self.assertEqual(result, [0.1, 0.2, 0.3, 0.4, 0.5])
+        mock_embedding.assert_called_once()
+
+    @patch("quantmind.llm.embedding.LITELLM_AVAILABLE", True)
+    @patch("quantmind.llm.embedding.litellm")
+    @patch("quantmind.llm.embedding.embedding")
+    def test_generate_embedding_failure(self, mock_embedding, mock_litellm):
+        """Test embedding generation failure."""
+        mock_embedding.side_effect = Exception("API Error")
+
+        block = EmbeddingBlock(self.config)
+        result = block.generate_embedding("Test text")
+
+        self.assertIsNone(result)
+
+    @patch("quantmind.llm.embedding.LITELLM_AVAILABLE", True)
+    @patch("quantmind.llm.embedding.litellm")
+    @patch("quantmind.llm.embedding.embedding")
+    def test_generate_embeddings_success(self, mock_embedding, mock_litellm):
+        """Test successful multiple embedding generation."""
+        # Mock response
+        mock_response = Mock()
+        mock_response.data = [
+            Mock(embedding=[0.1, 0.2, 0.3]),
+            Mock(embedding=[0.4, 0.5, 0.6]),
+        ]
+        mock_embedding.return_value = mock_response
+
+        block = EmbeddingBlock(self.config)
+        result = block.generate_embeddings(["Text 1", "Text 2"])
+
+        self.assertEqual(result, [[0.1, 0.2, 0.3], [0.4, 0.5, 0.6]])
+        mock_embedding.assert_called_once()
+
+    @patch("quantmind.llm.embedding.LITELLM_AVAILABLE", True)
+    @patch("quantmind.llm.embedding.litellm")
+    @patch("quantmind.llm.embedding.embedding")
+    def test_generate_embeddings_failure(self, mock_embedding, mock_litellm):
+        """Test multiple embedding generation failure."""
+        mock_embedding.side_effect = Exception("API Error")
+
+        block = EmbeddingBlock(self.config)
+        result = block.generate_embeddings(["Text 1", "Text 2"])
+
+        self.assertIsNone(result)
+
+    @patch("quantmind.llm.embedding.LITELLM_AVAILABLE", True)
+    @patch("quantmind.llm.embedding.litellm")
+    @patch("quantmind.llm.embedding.embedding")
+    def test_call_with_retry_success(self, mock_embedding, mock_litellm):
+        """Test successful call with retry."""
+        mock_response = Mock()
+        mock_embedding.return_value = mock_response
+
+        block = EmbeddingBlock(self.config)
+        result = block._call_with_retry(
+            {"model": "text-embedding-ada-002", "input": "test"}
+        )
+
+        self.assertEqual(result, mock_response)
+        mock_embedding.assert_called_once()
+
+    @patch("quantmind.llm.embedding.LITELLM_AVAILABLE", True)
+    @patch("quantmind.llm.embedding.litellm")
+    @patch("quantmind.llm.embedding.embedding")
+    @patch("time.sleep")
+    def test_call_with_retry_failure_then_success(
+        self, mock_sleep, mock_embedding, mock_litellm
+    ):
+        """Test retry logic with failure then success."""
+        mock_response = Mock()
+        mock_embedding.side_effect = [
+            Exception("First failure"),
+            mock_response,
+        ]
+
+        block = EmbeddingBlock(self.config)
+        result = block._call_with_retry(
+            {"model": "text-embedding-ada-002", "input": "test"}
+        )
+
+        self.assertEqual(result, mock_response)
+        self.assertEqual(mock_embedding.call_count, 2)
+        mock_sleep.assert_called_once_with(1.0)
+
+    @patch("quantmind.llm.embedding.LITELLM_AVAILABLE", True)
+    @patch("quantmind.llm.embedding.litellm")
+    @patch("quantmind.llm.embedding.embedding")
+    @patch("time.sleep")
+    def test_call_with_retry_all_failures(
+        self, mock_sleep, mock_embedding, mock_litellm
+    ):
+        """Test retry logic with all failures."""
+        mock_embedding.side_effect = Exception("Always fails")
+
+        block = EmbeddingBlock(self.config)
+        result = block._call_with_retry(
+            {"model": "text-embedding-ada-002", "input": "test"}
+        )
+
+        self.assertIsNone(result)
+        self.assertEqual(mock_embedding.call_count, 4)  # 1 initial + 3 retries
+        self.assertEqual(mock_sleep.call_count, 3)
+
+    @patch("quantmind.llm.embedding.LITELLM_AVAILABLE", True)
+    @patch("quantmind.llm.embedding.litellm")
+    @patch("quantmind.llm.embedding.embedding")
+    def test_test_connection_success(self, mock_embedding, mock_litellm):
+        """Test successful connection test."""
+        mock_response = Mock()
+        mock_response.data = [Mock()]
+        mock_response.data[0].embedding = [0.1, 0.2, 0.3]
+        mock_embedding.return_value = mock_response
+
+        block = EmbeddingBlock(self.config)
+        result = block.test_connection()
+
+        self.assertTrue(result)
+
+    @patch("quantmind.llm.embedding.LITELLM_AVAILABLE", True)
+    @patch("quantmind.llm.embedding.litellm")
+    @patch("quantmind.llm.embedding.embedding")
+    def test_test_connection_failure(self, mock_embedding, mock_litellm):
+        """Test connection test failure."""
+        mock_embedding.side_effect = Exception("Connection failed")
+
+        block = EmbeddingBlock(self.config)
+        result = block.test_connection()
+
+        self.assertFalse(result)
+
+    @patch("quantmind.llm.embedding.LITELLM_AVAILABLE", True)
+    @patch("quantmind.llm.embedding.litellm")
+    @patch("quantmind.llm.embedding.embedding")
+    def test_get_embedding_dimension_from_config(
+        self, mock_embedding, mock_litellm
+    ):
+        """Test getting embedding dimension from config."""
+        config = EmbeddingConfig(
+            model="text-embedding-3-small",
+            dimensions=512,
+        )
+        block = EmbeddingBlock(config)
+        dimension = block.get_embedding_dimension()
+
+        self.assertEqual(dimension, 512)
+
+    @patch("quantmind.llm.embedding.LITELLM_AVAILABLE", True)
+    @patch("quantmind.llm.embedding.litellm")
+    @patch("quantmind.llm.embedding.embedding")
+    def test_get_embedding_dimension_from_test_embedding(
+        self, mock_embedding, mock_litellm
+    ):
+        """Test getting embedding dimension by generating test embedding."""
+        mock_response = Mock()
+        mock_response.data = [Mock()]
+        mock_response.data[0].embedding = [0.1, 0.2, 0.3, 0.4, 0.5]
+        mock_embedding.return_value = mock_response
+
+        block = EmbeddingBlock(self.config)
+        dimension = block.get_embedding_dimension()
+
+        self.assertEqual(dimension, 5)
+
+    @patch("quantmind.llm.embedding.LITELLM_AVAILABLE", True)
+    @patch("quantmind.llm.embedding.litellm")
+    @patch("quantmind.llm.embedding.embedding")
+    def test_get_embedding_dimension_failure(
+        self, mock_embedding, mock_litellm
+    ):
+        """Test getting embedding dimension when test embedding fails."""
+        mock_embedding.side_effect = Exception("API Error")
+
+        block = EmbeddingBlock(self.config)
+        dimension = block.get_embedding_dimension()
+
+        self.assertIsNone(dimension)
+
+    @patch("quantmind.llm.embedding.LITELLM_AVAILABLE", True)
+    @patch("quantmind.llm.embedding.litellm")
+    def test_get_info(self, mock_litellm):
+        """Test getting block info."""
+        block = EmbeddingBlock(self.config)
+        info = block.get_info()
+
+        expected_keys = ["model", "provider", "timeout", "retry_attempts"]
+        for key in expected_keys:
+            self.assertIn(key, info)
+
+        self.assertEqual(info["model"], "text-embedding-ada-002")
+        self.assertEqual(info["provider"], "openai")
+        self.assertEqual(info["timeout"], 30)
+        self.assertEqual(info["retry_attempts"], 3)
+
+    @patch("quantmind.llm.embedding.LITELLM_AVAILABLE", True)
+    @patch("quantmind.llm.embedding.litellm")
+    def test_update_config(self, mock_litellm):
+        """Test configuration update."""
+        block = EmbeddingBlock(self.config)
+
+        # Check initial config
+        self.assertEqual(block.config.timeout, 30)
+        self.assertEqual(block.config.api_key, "test-key")
+
+        # Update config
+        block.update_config(timeout=60, api_key="new-key")
+
+        # Check updated config
+        self.assertEqual(block.config.timeout, 60)
+        self.assertEqual(block.config.api_key, "new-key")
+        # Other values should remain unchanged
+        self.assertEqual(block.config.model, "text-embedding-ada-002")
+
+    @patch("quantmind.llm.embedding.LITELLM_AVAILABLE", True)
+    @patch("quantmind.llm.embedding.litellm")
+    def test_temporary_config(self, mock_litellm):
+        """Test temporary configuration context manager."""
+        block = EmbeddingBlock(self.config)
+
+        # Check initial config
+        self.assertEqual(block.config.timeout, 30)
+
+        # Use temporary config
+        with block.temporary_config(timeout=60):
+            self.assertEqual(block.config.timeout, 60)
+
+        # Check config is restored
+        self.assertEqual(block.config.timeout, 30)
+
+    @patch("quantmind.llm.embedding.LITELLM_AVAILABLE", True)
+    @patch("quantmind.llm.embedding.litellm")
+    @patch("quantmind.llm.embedding.embedding")
+    def test_batch_embed_success(self, mock_embedding, mock_litellm):
+        """Test successful batch embedding."""
+        mock_response = Mock()
+        mock_response.data = [
+            Mock(embedding=[0.1, 0.2]),
+            Mock(embedding=[0.3, 0.4]),
+        ]
+        mock_embedding.return_value = mock_response
+
+        block = EmbeddingBlock(self.config)
+        texts = ["Text 1", "Text 2", "Text 3", "Text 4"]
+        result = block.batch_embed(texts, batch_size=2)
+
+        expected = [[0.1, 0.2], [0.3, 0.4], [0.1, 0.2], [0.3, 0.4]]
+        self.assertEqual(result, expected)
+        self.assertEqual(mock_embedding.call_count, 2)  # 2 batches
+
+    @patch("quantmind.llm.embedding.LITELLM_AVAILABLE", True)
+    @patch("quantmind.llm.embedding.litellm")
+    @patch("quantmind.llm.embedding.embedding")
+    def test_batch_embed_failure(self, mock_embedding, mock_litellm):
+        """Test batch embedding failure."""
+        mock_embedding.side_effect = Exception("API Error")
+
+        block = EmbeddingBlock(self.config)
+        texts = ["Text 1", "Text 2", "Text 3", "Text 4"]
+        result = block.batch_embed(texts, batch_size=2)
+
+        self.assertIsNone(result)
+
+    @patch("quantmind.llm.embedding.LITELLM_AVAILABLE", True)
+    @patch("quantmind.llm.embedding.litellm")
+    @patch("quantmind.llm.embedding.embedding")
+    @patch("time.sleep")
+    def test_batch_embed_with_delay(
+        self, mock_sleep, mock_embedding, mock_litellm
+    ):
+        """Test batch embedding with delay between batches."""
+        config = EmbeddingConfig(
+            model="text-embedding-ada-002",
+            api_key="test-key",
+            timeout=30,
+            retry_delay=0.1,
+        )
+
+        mock_response = Mock()
+        mock_response.data = [
+            Mock(embedding=[0.1, 0.2]),
+            Mock(embedding=[0.3, 0.4]),
+        ]
+        mock_embedding.return_value = mock_response
+
+        block = EmbeddingBlock(config)
+        texts = ["Text 1", "Text 2", "Text 3", "Text 4"]
+        result = block.batch_embed(texts, batch_size=2)
+
+        # Should have delay between batches
+        self.assertEqual(mock_sleep.call_count, 1)  # Delay between 2 batches
+
+    @patch("quantmind.llm.embedding.LITELLM_AVAILABLE", True)
+    @patch("quantmind.llm.embedding.litellm")
+    @patch("quantmind.llm.embedding.embedding")
+    def test_generate_embedding_with_kwargs(self, mock_embedding, mock_litellm):
+        """Test embedding generation with additional kwargs."""
+        mock_response = Mock()
+        mock_response.data = [Mock()]
+        mock_response.data[0].embedding = [0.1, 0.2, 0.3]
+        mock_embedding.return_value = mock_response
+
+        block = EmbeddingBlock(self.config)
+        result = block.generate_embedding(
+            "Test text", dimensions=512, user="test_user"
+        )
+
+        # Check that kwargs were passed to the embedding call
+        call_args = mock_embedding.call_args
+        self.assertIn("dimensions", call_args[1])
+        self.assertIn("user", call_args[1])
+        self.assertEqual(call_args[1]["dimensions"], 512)
+        self.assertEqual(call_args[1]["user"], "test_user")
+
+    @patch("quantmind.llm.embedding.LITELLM_AVAILABLE", True)
+    @patch("quantmind.llm.embedding.litellm")
+    @patch("quantmind.llm.embedding.embedding")
+    def test_generate_embeddings_with_kwargs(
+        self, mock_embedding, mock_litellm
+    ):
+        """Test multiple embedding generation with additional kwargs."""
+        mock_response = Mock()
+        mock_response.data = [
+            Mock(embedding=[0.1, 0.2]),
+            Mock(embedding=[0.3, 0.4]),
+        ]
+        mock_embedding.return_value = mock_response
+
+        block = EmbeddingBlock(self.config)
+        result = block.generate_embeddings(
+            ["Text 1", "Text 2"], dimensions=512, user="test_user"
+        )
+
+        # Check that kwargs were passed to the embedding call
+        call_args = mock_embedding.call_args
+        self.assertIn("dimensions", call_args[1])
+        self.assertIn("user", call_args[1])
+        self.assertEqual(call_args[1]["dimensions"], 512)
+        self.assertEqual(call_args[1]["user"], "test_user")
+
+
+class TestCreateEmbeddingBlock(unittest.TestCase):
+    """Test cases for create_embedding_block function."""
+
+    @patch("quantmind.llm.embedding.LITELLM_AVAILABLE", True)
+    @patch("quantmind.llm.embedding.litellm")
+    def test_create_embedding_block(self, mock_litellm):
+        """Test EmbeddingBlock creation."""
+        config = EmbeddingConfig(model="text-embedding-ada-002")
+        block = create_embedding_block(config)
+
+        self.assertIsInstance(block, EmbeddingBlock)
+        self.assertEqual(block.config, config)
+
+
+if __name__ == "__main__":
+    unittest.main()
diff --git a/tests/llm/test_block.py b/tests/llm/test_llm_block.py
similarity index 100%
rename from tests/llm/test_block.py
rename to tests/llm/test_llm_block.py

From c0622a310332dc634bd454fc424f1945a4061241 Mon Sep 17 00:00:00 2001
From: bridgeqiqi <Bridgeqiqi@163.com>
Date: Sat, 2 Aug 2025 03:02:35 +0800
Subject: [PATCH 07/17] fix(embedding): trim trailing whitespace

---
 wiki/embedding.md | 24 ++++++++++++------------
 1 file changed, 12 insertions(+), 12 deletions(-)

diff --git a/wiki/embedding.md b/wiki/embedding.md
index 854c151..158a37b 100644
--- a/wiki/embedding.md
+++ b/wiki/embedding.md
@@ -170,14 +170,14 @@ from sklearn.metrics.pairwise import cosine_similarity
 def calculate_similarity(text1: str, text2: str) -> float:
     """Calculate semantic similarity between two texts."""
     embeddings = embedding_block.generate_embeddings([text1, text2])
-    
+
     if embeddings and len(embeddings) == 2:
         similarity = cosine_similarity(
-            [embeddings[0]], 
+            [embeddings[0]],
             [embeddings[1]]
         )[0][0]
         return similarity
-    
+
     return 0.0
 
 # Example usage
@@ -244,7 +244,7 @@ print(f"Format: {info['encoding_format']}")
 def efficient_batch_embedding(texts: List[str], batch_size: int = 100):
     """Process texts in optimal batches."""
     all_embeddings = []
-    
+
     for i in range(0, len(texts), batch_size):
         batch = texts[i:i + batch_size]
         try:
@@ -253,7 +253,7 @@ def efficient_batch_embedding(texts: List[str], batch_size: int = 100):
                 all_embeddings.extend(batch_embeddings)
         except Exception as e:
             print(f"Error processing batch {i//batch_size + 1}: {e}")
-    
+
     return all_embeddings
 ```
 
@@ -271,7 +271,7 @@ def robust_embedding_generation(text: str, max_retries: int = 3):
             print(f"Attempt {attempt + 1} failed: {e}")
             if attempt < max_retries - 1:
                 time.sleep(2 ** attempt)  # Exponential backoff
-    
+
     return None
 ```
 
@@ -287,25 +287,25 @@ class CachedEmbeddingBlock:
         self.embedding_block = embedding_block
         self.cache_dir = cache_dir
         os.makedirs(cache_dir, exist_ok=True)
-    
+
     def get_embedding(self, text: str) -> Optional[List[float]]:
         # Create cache key
         text_hash = hashlib.md5(text.encode()).hexdigest()
         cache_file = os.path.join(self.cache_dir, f"{text_hash}.pkl")
-        
+
         # Check cache
         if os.path.exists(cache_file):
             with open(cache_file, 'rb') as f:
                 return pickle.load(f)
-        
+
         # Generate embedding
         embedding = self.embedding_block.generate_embedding(text)
-        
+
         # Cache result
         if embedding:
             with open(cache_file, 'wb') as f:
                 pickle.dump(embedding, f)
-        
+
         return embedding
 ```
 
@@ -323,4 +323,4 @@ class CachedEmbeddingBlock:
 
 ---
 
-*Last updated: January 2025* 
\ No newline at end of file
+*Last updated: January 2025*

From 6de8b01d769f865da41dd40ea910a8db543faf5d Mon Sep 17 00:00:00 2001
From: bridgeqiqi <Bridgeqiqi@163.com>
Date: Sat, 2 Aug 2025 03:04:00 +0800
Subject: [PATCH 08/17] fix(embedding): trim trailing whitespace

---
 docs/EMBEDDINGS.md | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/docs/EMBEDDINGS.md b/docs/EMBEDDINGS.md
index ff5176a..2a60ba1 100644
--- a/docs/EMBEDDINGS.md
+++ b/docs/EMBEDDINGS.md
@@ -73,4 +73,4 @@ config = EmbeddingConfig(
 
 ## See Also
 
-- `examples/llm/embedding_block_example.py` for complete examples 
\ No newline at end of file
+- `examples/llm/embedding_block_example.py` for complete examples

From d9306b6b91b585020563d1e3e93894a708b55ca1 Mon Sep 17 00:00:00 2001
From: bridgeqiqi <13122919903@163.com>
Date: Sat, 2 Aug 2025 12:33:02 +0800
Subject: [PATCH 09/17] feat(embedding): Remove unused code in
 quantmind/config/embedding.py

Co-authored-by: Copilot <175728472+Copilot@users.noreply.github.com>
---
 quantmind/config/embedding.py | 1 -
 1 file changed, 1 deletion(-)

diff --git a/quantmind/config/embedding.py b/quantmind/config/embedding.py
index 72efec4..bf2b6c9 100644
--- a/quantmind/config/embedding.py
+++ b/quantmind/config/embedding.py
@@ -1,6 +1,5 @@
 """Embedding configuration for QuantMind."""
 
-from random import choices
 from typing import Any, Dict, Optional
 
 from litellm import retry

From dfe32f9c14533fe73bb9aff6bd02d7067f67eaf0 Mon Sep 17 00:00:00 2001
From: bridgeqiqi <13122919903@163.com>
Date: Sat, 2 Aug 2025 12:33:12 +0800
Subject: [PATCH 10/17] feat(embedding): Remove unused code in
 quantmind/config/embedding.py

Co-authored-by: Copilot <175728472+Copilot@users.noreply.github.com>
---
 quantmind/config/embedding.py | 1 -
 1 file changed, 1 deletion(-)

diff --git a/quantmind/config/embedding.py b/quantmind/config/embedding.py
index bf2b6c9..cf78e0d 100644
--- a/quantmind/config/embedding.py
+++ b/quantmind/config/embedding.py
@@ -2,7 +2,6 @@
 
 from typing import Any, Dict, Optional
 
-from litellm import retry
 from pydantic import BaseModel, Field, field_validator
 
 

From feccbfb47c989fcc53ec033c9fe357c40d6506a7 Mon Sep 17 00:00:00 2001
From: bridgeqiqi <13122919903@163.com>
Date: Sat, 2 Aug 2025 12:33:26 +0800
Subject: [PATCH 11/17] feat(embedding): Remove unused code in
 quantmind/llm/embedding.py

Co-authored-by: Copilot <175728472+Copilot@users.noreply.github.com>
---
 quantmind/llm/embedding.py | 1 -
 1 file changed, 1 deletion(-)

diff --git a/quantmind/llm/embedding.py b/quantmind/llm/embedding.py
index a1ecbc2..37bae3c 100644
--- a/quantmind/llm/embedding.py
+++ b/quantmind/llm/embedding.py
@@ -2,7 +2,6 @@
 
 import os
 import time
-import numpy as np
 from contextlib import contextmanager
 from typing import Any, Dict, List, Optional
 

From e9c3169a5582f120d892e93a84c24f19cedd4cb9 Mon Sep 17 00:00:00 2001
From: bridgeqiqi <13122919903@163.com>
Date: Sat, 2 Aug 2025 12:33:38 +0800
Subject: [PATCH 12/17] feat(embedding): Remove unused code in
 examples/llm/embedding_block_example.py

Co-authored-by: Copilot <175728472+Copilot@users.noreply.github.com>
---
 examples/llm/embedding_block_example.py | 1 -
 1 file changed, 1 deletion(-)

diff --git a/examples/llm/embedding_block_example.py b/examples/llm/embedding_block_example.py
index 25bc954..7ffdc78 100644
--- a/examples/llm/embedding_block_example.py
+++ b/examples/llm/embedding_block_example.py
@@ -135,7 +135,6 @@ def example_azure_embeddings():
 
     # Create embedding block
     embedding_block = create_embedding_block(config)
-
     # Test connection
     if embedding_block.test_connection():
         print("✅ Azure OpenAI connection successful")

From 37405f7dcfe8f8bff0dd9a098b50b68462113857 Mon Sep 17 00:00:00 2001
From: Du BIAN <scncdba@gmail.com>
Date: Tue, 29 Jul 2025 19:39:32 +0800
Subject: [PATCH 13/17] chore(readme): optimize the text description in README
 (#44)

---
 README.md | 14 ++++++++++++--
 1 file changed, 12 insertions(+), 2 deletions(-)

diff --git a/README.md b/README.md
index b87326a..246f9dc 100644
--- a/README.md
+++ b/README.md
@@ -31,16 +31,26 @@
 ---
 
 **QuantMind** is an intelligent knowledge extraction and retrieval framework for quantitative finance. It transforms unstructured financial content—papers, news, blogs, reports—into a queryable knowledge base, enabling AI-powered research at scale.
+### 🧐 Overview
+QuantMind is a next-generation AI platform that ingests, processes, and structures **every** new piece of quantitative-finance research, including papers, news, blogs, and SEC filings into a **semantic knowledge graph**. Institutional investors, hedge funds, and research teams can now explore the frontier of factor strategies, risk models, and market insights in **seconds**, unlocking alpha that would otherwise remain buried.
 
 ### ✨ Why QuantMind?
 
-The financial research landscape is overwhelming. Every day, hundreds of papers, articles, and reports are published. **QuantMind** solves this by:
+The financial research landscape is overwhelming. Every day, hundreds of papers, articles, and reports are published.
 
+
+#### 🌐 The Opportunity
+- **Information Overload**: 500 new research papers & reports published daily. Manual review takes weeks—costly, error-prone, and non-scalable
+- **Massive Market**: Financial data & analytics market ≫ expected to grow to US$961.89 billion by 2032, with a compound annual growth rate of 13.5%. Tens of thousands of quant teams & asset managers hungry for speed
+- **High ROI**: 1% improvement in research efficiency can translate to millions saved or earned in trading performance
+
+---
+
+#### 💡 **QuantMind** solves this by:
 - 🔍 **Extracting** structured knowledge from any source (PDFs, web pages, APIs)
 - 🧠 **Understanding** content with domain-specific LLMs fine-tuned for finance
 - 💾 **Storing** information in a semantic knowledge graph
 - 🚀 **Retrieving** insights through natural language queries
-
 ---
 
 ### System Architecture

From d6435bfa98e79ee95f678210b83922a86aad34f3 Mon Sep 17 00:00:00 2001
From: bridgeqiqi <Bridgeqiqi@163.com>
Date: Sat, 2 Aug 2025 12:36:37 +0800
Subject: [PATCH 14/17] feat(embedding): remove duplicate code

---
 examples/llm/embedding_block_example.py | 2 --
 1 file changed, 2 deletions(-)

diff --git a/examples/llm/embedding_block_example.py b/examples/llm/embedding_block_example.py
index 7ffdc78..d47f044 100644
--- a/examples/llm/embedding_block_example.py
+++ b/examples/llm/embedding_block_example.py
@@ -133,8 +133,6 @@ def example_azure_embeddings():
     # Create embedding block
     embedding_block = create_embedding_block(config)
 
-    # Create embedding block
-    embedding_block = create_embedding_block(config)
     # Test connection
     if embedding_block.test_connection():
         print("✅ Azure OpenAI connection successful")

From 7365076581c794f8e9fabfa7408fdd9b306e3a48 Mon Sep 17 00:00:00 2001
From: bridgeqiqi <Bridgeqiqi@163.com>
Date: Sat, 2 Aug 2025 23:31:48 +0800
Subject: [PATCH 15/17] feat(embedding): fix comments

---
 quantmind/config/embedding.py |  6 ++----
 quantmind/llm/embedding.py    | 40 +++++++++++++++++------------------
 2 files changed, 22 insertions(+), 24 deletions(-)

diff --git a/quantmind/config/embedding.py b/quantmind/config/embedding.py
index cf78e0d..2633e75 100644
--- a/quantmind/config/embedding.py
+++ b/quantmind/config/embedding.py
@@ -111,10 +111,8 @@ def get_provider_type(self) -> str:
             return "azure"
 
         # Cohere models
-        elif model_lower.startswith("embed-") or model_lower.startswith(
-            "cohere/"
-        ):
-            return "cohere"
+        elif "gemini" in model_lower:
+            return "gemini"
 
         # Default to openai for unknown models
         else:
diff --git a/quantmind/llm/embedding.py b/quantmind/llm/embedding.py
index 37bae3c..36bddbf 100644
--- a/quantmind/llm/embedding.py
+++ b/quantmind/llm/embedding.py
@@ -34,10 +34,10 @@ def __init__(self, config: EmbeddingConfig):
         """Initialize the EmbeddingBlock with configuration.
 
         Args:
-                config: Embedding configuration
+            config: Embedding configuration
 
         Raises:
-                ImportError: If LiteLLM is not available.
+            ImportError: If LiteLLM is not available.
         """
         if not LITELLM_AVAILABLE:
             raise ImportError(
@@ -76,11 +76,11 @@ def generate_embedding(self, text: str, **kwargs) -> Optional[List[float]]:
         """Generate embedding using the configured Embedding model.
 
         Args:
-                text (str): The input text to embed.
-                **kwargs: Additional parameters to override config
+            text (str): The input text to embed.
+            **kwargs: Additional parameters to override config
 
         Returns:
-                List[float]: The embedding vector as a list of floats, or None if failed.
+            List[float]: The embedding vector as a list of floats, or None if failed.
         """
         try:
             # Get LiteLLM parameters
@@ -114,11 +114,11 @@ def generate_embeddings(
         """Generate embeddings for multiple texts.
 
         Args:
-                texts (List[str]): List of input texts to embed.
-                **kwargs: Additional parameters to override config
+            texts (List[str]): List of input texts to embed.
+            **kwargs: Additional parameters to override config
 
         Returns:
-                List[List[float]]: List of embedding vectors, or None if failed.
+            List[List[float]]: List of embedding vectors, or None if failed.
         """
         try:
             # Get LiteLLM parameters
@@ -145,10 +145,10 @@ def _call_with_retry(self, params: Dict[str, Any]) -> Optional[Any]:
         """Call LiteLLM embedding with retry logic.
 
         Args:
-                params (Dict[str, Any]): The parameters to pass to the embedding function.
+            params (Dict[str, Any]): The parameters to pass to the embedding function.
 
         Returns:
-                Optional[Any]: The embedding result or None if failed.
+            Optional[Any]: The embedding result or None if failed.
         """
         last_exception = None
         for attempt in range(self.config.retry_attempts + 1):
@@ -223,7 +223,7 @@ def get_embedding_dimension(self) -> Optional[int]:
         """Get the dimension of embeddings generated by this model.
 
         Returns:
-                Embedding dimension or None if not available
+            Embedding dimension or None if not available
         """
         # First check if dimensions is specified in config
         if self.config.dimensions:
@@ -241,7 +241,7 @@ def update_config(self, **kwargs) -> None:
         """Update the embedding configuration.
 
         Args:
-                **kwargs: Configuration parameters to update
+            **kwargs: Configuration parameters to update
         """
         for key, value in kwargs.items():
             if hasattr(self.config, key):
@@ -254,10 +254,10 @@ def temporary_config(self, **kwargs):
         """Temporarily modify configuration for a context.
 
         Args:
-                **kwargs: Temporary configuration parameters
+            **kwargs: Temporary configuration parameters
 
         Yields:
-                Self with temporary configuration
+            Self with temporary configuration
         """
         original_config = {}
         for key, value in kwargs.items():
@@ -278,12 +278,12 @@ def batch_embed(
         """Generate embeddings in batches for large datasets.
 
         Args:
-                texts: List of texts to embed
-                batch_size: Number of texts to process in each batch
-                **kwargs: Additional parameters for embedding generation
+            texts: List of texts to embed
+            batch_size: Number of texts to process in each batch
+            **kwargs: Additional parameters for embedding generation
 
         Returns:
-                List of embedding vectors or None if failed
+            List of embedding vectors or None if failed
         """
         try:
             all_embeddings = []
@@ -315,9 +315,9 @@ def create_embedding_block(config: EmbeddingConfig) -> EmbeddingBlock:
     """Create an EmbeddingBlock instance.
 
     Args:
-            config: Embedding configuration
+        config: Embedding configuration
 
     Returns:
-            Configured EmbeddingBlock instance
+        Configured EmbeddingBlock instance
     """
     return EmbeddingBlock(config)

From 549b6db863679c8fa83123b5d9c1c1e68209ede7 Mon Sep 17 00:00:00 2001
From: bridgeqiqi <Bridgeqiqi@163.com>
Date: Sat, 2 Aug 2025 23:37:45 +0800
Subject: [PATCH 16/17] feat(embedding): fix comments

---
 quantmind/llm/embedding.py     | 4 ++--
 tests/config/test_embedding.py | 9 +++------
 wiki/embedding.md              | 2 --
 3 files changed, 5 insertions(+), 10 deletions(-)

diff --git a/quantmind/llm/embedding.py b/quantmind/llm/embedding.py
index 36bddbf..3bf56db 100644
--- a/quantmind/llm/embedding.py
+++ b/quantmind/llm/embedding.py
@@ -65,8 +65,8 @@ def _setup_litellm(self):
                 os.environ["OPENAI_API_KEY"] = self.config.api_key
             elif provider_type == "azure":
                 os.environ["AZURE_API_KEY"] = self.config.api_key
-            elif provider_type == "cohere":
-                os.environ["COHERE_API_KEY"] = self.config.api_key
+            elif provider_type == "gemini":
+                os.environ["GEMINI_API_KEY"] = self.config.api_key
 
         logger.debug(
             f"Configured LiteLLM for provider: {self.config.get_provider_type()}"
diff --git a/tests/config/test_embedding.py b/tests/config/test_embedding.py
index 8c75108..d51e434 100644
--- a/tests/config/test_embedding.py
+++ b/tests/config/test_embedding.py
@@ -102,12 +102,9 @@ def test_get_provider_type(self):
         config = EmbeddingConfig(model="text-embedding-ada-002-azure")
         self.assertEqual(config.get_provider_type(), "azure")
 
-        # Cohere models
-        config = EmbeddingConfig(model="embed-english-v3.0")
-        self.assertEqual(config.get_provider_type(), "cohere")
-
-        config = EmbeddingConfig(model="cohere/embed-multilingual-v3.0")
-        self.assertEqual(config.get_provider_type(), "cohere")
+        # Gemini models
+        config = EmbeddingConfig(model="gemini/embed-multilingual-v3.0")
+        self.assertEqual(config.get_provider_type(), "gemini")
 
         # Unknown models
         config = EmbeddingConfig(model="unknown-model")
diff --git a/wiki/embedding.md b/wiki/embedding.md
index 158a37b..54bd300 100644
--- a/wiki/embedding.md
+++ b/wiki/embedding.md
@@ -42,7 +42,6 @@ Embeddings map discrete objects (words, sentences, documents) to continuous vect
 | `text-embedding-ada-002` | 1536 | General purpose | OpenAI |
 | `text-embedding-3-small` | 1536 | High performance | OpenAI |
 | `text-embedding-3-large` | 3072 | Maximum quality | OpenAI |
-| `embed-english-v3.0` | 1024 | Multilingual | Cohere |
 
 ## 📌 Architecture
 
@@ -318,7 +317,6 @@ class CachedEmbeddingBlock:
 ## 🔗 External Resources
 
 - [OpenAI Embeddings Guide](https://platform.openai.com/docs/guides/embeddings)
-- [Cohere Embeddings](https://docs.cohere.com/docs/embeddings)
 - [Vector Similarity Search](https://www.pinecone.io/learn/vector-similarity-search/)
 
 ---

From 858ea9bedf6bade0da980ef8fd43b71315a5f0f4 Mon Sep 17 00:00:00 2001
From: bridgeqiqi <Bridgeqiqi@163.com>
Date: Sun, 3 Aug 2025 00:38:32 +0800
Subject: [PATCH 17/17] feat(embedding): fix comments

---
 examples/llm/embedding_block_example.py | 57 -------------------------
 quantmind/config/embedding.py           |  2 +-
 quantmind/llm/embedding.py              |  2 +-
 3 files changed, 2 insertions(+), 59 deletions(-)

diff --git a/examples/llm/embedding_block_example.py b/examples/llm/embedding_block_example.py
index d47f044..ec477c7 100644
--- a/examples/llm/embedding_block_example.py
+++ b/examples/llm/embedding_block_example.py
@@ -58,61 +58,6 @@ def example_openai_embeddings():
     info = embedding_block.get_info()
     print(f"📊 Model info: {info['model']}")
     print(f"📊 Provider: {info['provider']}")
-    print(f"📊 Dimension: {info['dimension']}")
-
-
-def example_openai_text_embedding_3():
-    """Example using OpenAI text-embedding-3 with custom dimensions."""
-    print("\n=== OpenAI Text-Embedding-3 Example ===")
-
-    # Configuration for OpenAI text-embedding-3
-    config = EmbeddingConfig(
-        model="text-embedding-3-small",
-        api_key=os.getenv("OPENAI_API_KEY"),
-        dimensions=512,  # Custom dimension (default is 1536)
-        timeout=30,
-        encoding_format="float",
-    )
-
-    # Create embedding block
-    embedding_block = create_embedding_block(config)
-
-    # Test connection
-    if embedding_block.test_connection():
-        print("✅ OpenAI text-embedding-3 connection successful")
-    else:
-        print("❌ OpenAI text-embedding-3 connection failed")
-        return
-
-    # Generate single embedding
-    text = (
-        "This is a sample text for embedding generation with custom dimensions."
-    )
-    embedding = embedding_block.generate_embedding(text)
-
-    if embedding:
-        print(f"✅ Generated embedding with {len(embedding)} dimensions")
-        print(f"   First 5 values: {embedding[:5]}")
-
-    # Generate multiple embeddings
-    texts = [
-        "First sample text for embedding.",
-        "Second sample text with different content.",
-        "Third sample text for batch processing.",
-    ]
-
-    embeddings = embedding_block.generate_embeddings(texts)
-
-    if embeddings:
-        print(f"✅ Generated {len(embeddings)} embeddings")
-        for i, emb in enumerate(embeddings):
-            print(f"   Text {i + 1}: {len(emb)} dimensions")
-
-    # Get embedding information
-    info = embedding_block.get_info()
-    print(f"📊 Model info: {info['model']}")
-    print(f"📊 Provider: {info['provider']}")
-    print(f"📊 Dimension: {info['dimension']}")
 
 
 def example_azure_embeddings():
@@ -166,7 +111,6 @@ def example_azure_embeddings():
     info = embedding_block.get_info()
     print(f"📊 Model info: {info['model']}")
     print(f"📊 Provider: {info['provider']}")
-    print(f"📊 Dimension: {info['dimension']}")
 
 
 def example_configuration_variants():
@@ -241,7 +185,6 @@ def main():
     # Run examples based on available API keys
     if os.getenv("OPENAI_API_KEY"):
         example_openai_embeddings()
-        example_openai_text_embedding_3()
     else:
         print("\n⚠️  Skipping OpenAI examples - OPENAI_API_KEY not set")
 
diff --git a/quantmind/config/embedding.py b/quantmind/config/embedding.py
index 2633e75..1774d5f 100644
--- a/quantmind/config/embedding.py
+++ b/quantmind/config/embedding.py
@@ -110,7 +110,7 @@ def get_provider_type(self) -> str:
         elif "azure" in model_lower:
             return "azure"
 
-        # Cohere models
+        # Gemini models
         elif "gemini" in model_lower:
             return "gemini"
 
diff --git a/quantmind/llm/embedding.py b/quantmind/llm/embedding.py
index 3bf56db..3b1c85f 100644
--- a/quantmind/llm/embedding.py
+++ b/quantmind/llm/embedding.py
@@ -24,7 +24,7 @@ class EmbeddingBlock:
     """A reusable Embedding function block using LiteLLM.
 
     EmbeddingBlock provides a consistent interface for generating embeddings across
-    different providers (OpenAI, Anthropic, etc.).
+    different providers (OpenAI, Gemini, etc.).
 
     Unlike workflows, EmbeddingBlock focuses on providing basic embedding capabilities
     without business logic.