Files
MemoryBear/api/app/repositories/document_repository.py

154 lines
5.4 KiB
Python

import uuid
import datetime
from sqlalchemy.orm import Session
from app.models.document_model import Document
from app.schemas import document_schema
from app.core.logging_config import get_db_logger
# Obtain a dedicated logger for the database
db_logger = get_db_logger()
def get_documents_paginated(
db: Session,
filters: list,
page: int,
pagesize: int,
orderby: str = None,
desc: bool = False
) -> tuple[int, list]:
"""
Paged query document (with filtering and sorting)
"""
db_logger.debug(f"Query documents in pages: page={page}, pagesize={pagesize}, orderby={orderby}, desc={desc}, filters_count={len(filters)}")
try:
query = db.query(Document)
# Apply filter conditions
for filter_cond in filters:
query = query.filter(filter_cond)
# Calculate the total count (for pagination)
total = query.count()
db_logger.debug(f"Total number of document queries: {total}")
# sort
if orderby:
order_attr = getattr(Document, orderby, None)
if order_attr is not None:
if desc:
query = query.order_by(order_attr.desc())
else:
query = query.order_by(order_attr.asc())
db_logger.debug(f"sort: {orderby}, desc={desc}")
# pagination
items = query.offset((page - 1) * pagesize).limit(pagesize).all()
db_logger.info(f"The document paging query has been successful: total={total}, Number of current page={len(items)}")
return total, [document_schema.Document.model_validate(item) for item in items]
except Exception as e:
db_logger.error(f"Querying document pagination failed: page={page}, pagesize={pagesize} - {str(e)}")
raise
def create_document(db: Session, document: document_schema.DocumentCreate) -> Document:
db_logger.debug(f"Create a document record: file_name={document.file_name}")
try:
db_document = Document(**document.model_dump())
db.add(db_document)
db.commit()
db_logger.info(f"Document record created successfully: {document.file_name} (ID: {db_document.id})")
return db_document
except Exception as e:
db_logger.error(f"Failed to create a document record: title={document.file_name} - {str(e)}")
db.rollback()
raise
def get_document_by_id(db: Session, document_id: uuid.UUID) -> Document | None:
db_logger.debug(f"Query documents based on ID: document_id={document_id}")
try:
document = db.query(Document).filter(Document.id == document_id).first()
if document:
db_logger.debug(f"Document query successful: {document.file_name} (ID: {document_id})")
else:
db_logger.debug(f"Document does not exist: document_id={document_id}")
return document
except Exception as e:
db_logger.error(f"Failed to query the document based on the ID: document_id={document_id} - {str(e)}")
raise
def reset_documents_progress_by_kb_id(db: Session, kb_id: uuid.UUID) -> int:
"""
Reset the processing progress of all documents under the specified knowledge base
Args:
db: database session
kb_id: Knowledge Base ID
Returns:
int: Number of updated documents
"""
db_logger.debug(f"Reset the processing progress of all documents under the specified knowledge base: kb_id={kb_id}")
try:
# Build update conditions
filters = [
Document.kb_id == kb_id
]
# Build updated data
update_data = {
Document.chunk_num: 0,
Document.progress: 0,
Document.progress_msg: "Pending",
Document.process_duration: 0,
Document.run: 0, # Reset run status
Document.updated_at: datetime.datetime.now()
}
# Perform batch update
result = db.query(Document).filter(*filters).update(
update_data,
synchronize_session=False
)
# commit transaction
db.commit()
db_logger.debug(f"Successfully reset the processing progress of all documents under the specified knowledge base: kb_id: {kb_id}")
return result
except Exception as e:
db.rollback()
db_logger.error(f"Failed to reset the processing progress of all documents under the specified knowledge base: kb_id={kb_id} - {str(e)}")
raise
def delete_document_by_id(db: Session, document_id: uuid.UUID):
db_logger.debug(f"Delete document record: document_id={document_id}")
try:
# First, query the document information for logging purposes
document = db.query(Document).filter(Document.id == document_id).first()
if document:
file_name = document.file_name
else:
file_name = "unknown"
result = db.query(Document).filter(Document.id == document_id).delete()
db.commit()
if result > 0:
db_logger.info(f"Document record deleted successfully: {file_name} (ID: {document_id})")
else:
db_logger.warning(f"The document record does not exist, and cannot be deleted: document_id={document_id}")
except Exception as e:
db_logger.error(f"Failed to delete document record: document_id={document_id} - {str(e)}")
db.rollback()
raise