Merge branch 'dev' into feature/dax/devops-svc

This commit is contained in:
dax.li 2025-07-15 03:34:15 +00:00
commit 3ce7a7ec76
4 changed files with 11 additions and 1 deletions

View File

@ -20,6 +20,7 @@ class ContentDataFormat(IntEnum):
class ContentFileConstants:
COVER_FILE_NAME: str = "cover.png"
HOVER_FILE_NAME: str = "hover.png"
SUMMARY_FILE_NAME: str = "summary.txt"
TITLE_FILE_NAME: str = "title.txt"
CONTENT_LINK_FILE_NAME: str = "content.link"

View File

@ -60,6 +60,7 @@ class ContentSharePointManager:
content_type_mapping = {
ContentFileConstants.COVER_FILE_NAME: "cover_document_id",
ContentFileConstants.HOVER_FILE_NAME: "hover_document_id",
ContentFileConstants.SUMMARY_FILE_NAME: "summary_text_new",
ContentFileConstants.TITLE_FILE_NAME: "title_text_new",
ContentFileConstants.CONTENT_LINK_FILE_NAME: "content_link",
@ -90,6 +91,7 @@ class ContentSharePointManager:
content_directory = ContentDirectory(
content_name=sp_folder["name"],
cover_document_id=None,
hover_document_id=None,
summary_text=None,
title_text=None,
content_link=None,

View File

@ -1,3 +1,4 @@
from datetime import datetime, timedelta
from typing import Set
from backend.content.models import DocumentDoc
from backend.content.models import ContentFolderDoc
@ -32,11 +33,16 @@ class DocumentCleaner:
print(
f"Valid document IDs (from updated content directories): {valid_document_ids}"
)
# Cutoff timestamp: one day before the current time, as a timezone-aware
# UTC datetime.
# NOTE: `datetime` in this module is the class (`from datetime import
# datetime`), which has no `UTC` attribute -- that constant lives on the
# `datetime` module -- so `datetime.UTC` would raise AttributeError here.
# `timezone.utc` is the equivalent tzinfo and works on all Python 3 versions.
from datetime import timezone

time_1_day_ago = datetime.now(timezone.utc) - timedelta(days=1)
# Retrieve all document IDs from DocumentDoc
all_document_ids = set()
async for doc in DocumentDoc.find(
{"created_by": {"$regex": "^content-service-"}}
{
"created_by": {"$regex": "^content-service-"},
"create_time": {"$lt": time_1_day_ago},
}
): # Fetch all documents that are created by content-service
if doc.document_id: # Ensure document_id is not None
all_document_ids.add(doc.document_id)

View File

@ -20,6 +20,7 @@ class ContentDirectory(BaseModel):
content_text: Optional[str] = None
content_text_new: Optional[str] = None
content_document_id: Optional[str] = None
hover_document_id: Optional[str] = None
class MediaType(IntEnum):