Fix/memory celery fix (#168)

* refactor(celery): optimize task routing and worker configuration
  - Simplify Celery queue configuration with a single default 'io_tasks' queue
  - Implement task routing strategy separating IO-bound and CPU-bound tasks
  - Add Flower monitoring support with task event tracking enabled
  - Add summary node search optimization to only retrieve summary nodes
  - Clean up unused imports and reorganize import statements for consistency
  - Update docker-compose configuration to support multi-queue worker setup
* chore(celery): simplify flower configuration and add gevent dependency
* chore(dependencies): add gevent dependency to requirements
  - Add gevent==24.11.1 to api/requirements.txt
  - Gevent is required for async worker support in Celery
  - Complements existing flower and celery configuration
* refactor(celery): simplify async event loop handling and reorganize task queues
  - Replace complex nest_asyncio and manual event loop management with asyncio.run() in read_message_task, write_message_task, regenerate_memory_cache, and workspace_reflection_task
  - Rename task queues from io_tasks/cpu_tasks to memory_tasks/document_tasks for better semantic clarity
  - Update task routing configuration to reflect new queue names for memory agent tasks and document processing tasks
  - Remove redundant exception handling comments and simplify error handling logic
  - Update README with improved community support section including GitHub Issues, Pull Requests, Discussions, and WeChat community links
  - Simplifies event loop management by leveraging asyncio.run(), which handles loop creation and cleanup automatically, reducing code complexity and potential race conditions
2026-01-21 17:58:46 +08:00
parent 37ef497f4c
commit c24fb73147
12 changed files with 254 additions and 259 deletions
--- a/api/app/core/validators/memory_config_validators.py
+++ b/api/app/core/validators/memory_config_validators.py
@@ -89,14 +89,15 @@ def validate_model_exists_and_active(
    start_time = time.time()
    
    try:
-        # First check if model exists at all (without tenant filtering)
-        model_without_tenant = ModelConfigRepository.get_by_id(db, model_id, tenant_id=None)
-        
-        # Then check with tenant filtering
+        # OPTIMIZED: Single query with tenant filter
+        # We'll check tenant mismatch in the error handling
        model = ModelConfigRepository.get_by_id(db, model_id, tenant_id)
        elapsed_ms = (time.time() - start_time) * 1000
        
        if not model:
+            # Model not found with tenant filter - check if it exists without filter
+            model_without_tenant = ModelConfigRepository.get_by_id(db, model_id, tenant_id=None)
+            
            if model_without_tenant:
                # Model exists but belongs to different tenant
                logger.warning(
@@ -208,8 +209,11 @@ def validate_embedding_model(
    db: Session,
    tenant_id: Optional[UUID] = None,
    workspace_id: Optional[UUID] = None
-) -> UUID:
-    """Validate that embedding model is available and return its UUID.
+) -> tuple[UUID, str]:
+    """Validate that embedding model is available and return its UUID and name.
+    
+    Returns:
+        Tuple of (embedding_uuid, embedding_name)
    
    Raises:
        InvalidConfigError: If embedding_id is not provided or invalid
@@ -225,14 +229,19 @@ def validate_embedding_model(
            workspace_id=workspace_id
        )
    
-    embedding_uuid, _ = validate_and_resolve_model_id(
+    embedding_uuid, embedding_name = validate_and_resolve_model_id(
        embedding_id, "embedding", db, tenant_id, required=True,
        config_id=config_id, workspace_id=workspace_id
    )
-    print(100*'-')
-    print(embedding_uuid)
-    print(_)
-    print(100*'-')
+    
+    logger.debug(
+        "Embedding model validated",
+        extra={
+            "embedding_uuid": str(embedding_uuid),
+            "embedding_name": embedding_name,
+            "config_id": config_id
+        }
+    )
    
    if embedding_uuid is None:
        raise InvalidConfigError(
@@ -243,7 +252,7 @@ def validate_embedding_model(
            workspace_id=workspace_id
        )
    
-    return embedding_uuid
+    return embedding_uuid, embedding_name


 def validate_llm_model(