ميزة: إضافة خدمة تحليلات لتكامل Google Analytics اختبار: تحديث اختبارات خدمة واجهة برمجة التطبيقات (API) لتعكس تغييرات نقاط النهاية إصلاح: تعديل خدمة واجهة برمجة التطبيقات (API) لدعم تحميل ملفات متعددة ومصادقة المستخدم ميزة: تطبيق مخزن مصادقة باستخدام Zustand لإدارة المستخدمين إصلاح: تحسين إعدادات Nginx لتعزيز الأمان ودعم التحليلات
225 lines
6.3 KiB
Python
225 lines
6.3 KiB
Python
"""Celery tasks for PDF conversion (PDF↔Word)."""
|
|
import os
|
|
import logging
|
|
|
|
from flask import current_app
|
|
|
|
from app.extensions import celery
|
|
from app.services.pdf_service import pdf_to_word, word_to_pdf, PDFConversionError
|
|
from app.services.storage_service import storage
|
|
from app.services.task_tracking_service import finalize_task_tracking
|
|
from app.utils.sanitizer import cleanup_task_files
|
|
|
|
|
|
def _cleanup(task_id: str):
    """Run ``cleanup_task_files`` for a task, keeping outputs when S3 is off.

    ``keep_outputs`` is the negation of ``storage.use_s3``.
    """
    # NOTE(review): presumably outputs must stay on disk to be served when
    # the storage backend is local — confirm against storage_service.
    preserve_outputs = not storage.use_s3
    cleanup_task_files(task_id, keep_outputs=preserve_outputs)
|
|
|
|
|
|
def _get_output_dir(task_id: str) -> str:
    """Return the per-task output directory, creating it when missing.

    The directory is ``<OUTPUT_FOLDER>/<task_id>``, where ``OUTPUT_FOLDER``
    is read from the current Flask application's config.
    """
    base_dir = current_app.config["OUTPUT_FOLDER"]
    task_dir = os.path.join(base_dir, task_id)
    # exist_ok=True: an already existing directory is not an error.
    os.makedirs(task_dir, exist_ok=True)
    return task_dir
|
|
|
|
|
|
def _finalize_task(
    task_id: str,
    user_id: int | None,
    tool: str,
    original_filename: str,
    result: dict,
    usage_source: str,
    api_key_id: int | None,
    celery_task_id: str | None,
):
    """Record the task outcome via task tracking, then clean up task files.

    Args:
        task_id: Identifier of the task whose files are cleaned up.
        user_id: Forwarded to ``finalize_task_tracking``.
        tool: Tool name forwarded to ``finalize_task_tracking``.
        original_filename: Forwarded to ``finalize_task_tracking``.
        result: Result dict for the task; forwarded to tracking and returned.
        usage_source: Forwarded to ``finalize_task_tracking``.
        api_key_id: Forwarded to ``finalize_task_tracking``.
        celery_task_id: Forwarded to ``finalize_task_tracking``.

    Returns:
        The same ``result`` object that was passed in.

    Raises:
        Whatever ``finalize_task_tracking`` or ``_cleanup`` raises; cleanup
        is still attempted when tracking fails.
    """
    try:
        finalize_task_tracking(
            user_id=user_id,
            tool=tool,
            original_filename=original_filename,
            result=result,
            usage_source=usage_source,
            api_key_id=api_key_id,
            celery_task_id=celery_task_id,
        )
    finally:
        # Run cleanup even if tracking raised, so a tracking failure does
        # not leave the task's files behind.
        _cleanup(task_id)
    return result
|
|
|
|
# Module-level logger, named after this module via ``__name__``.
logger = logging.getLogger(__name__)
|
|
|
|
|
|
@celery.task(bind=True, name="app.tasks.convert_tasks.convert_pdf_to_word")
def convert_pdf_to_word(
    self,
    input_path: str,
    task_id: str,
    original_filename: str,
    user_id: int | None = None,
    usage_source: str = "web",
    api_key_id: int | None = None,
):
    """
    Async task: Convert PDF to Word document.

    Exceptions raised inside the conversion/upload steps are caught and
    reported as a ``"failed"`` result dict; every outcome is passed through
    ``_finalize_task`` before being returned.

    Args:
        input_path: Path to the uploaded PDF file
        task_id: Unique task identifier
        original_filename: Original filename for download
        user_id: Forwarded to ``_finalize_task`` for task tracking
        usage_source: Forwarded to ``_finalize_task`` (defaults to "web")
        api_key_id: Forwarded to ``_finalize_task`` for task tracking

    Returns:
        On success, a dict with ``status`` ("completed"), ``download_url``,
        ``filename`` and ``output_size``. On failure, a dict with ``status``
        ("failed") and ``error``.
    """
    output_dir = _get_output_dir(task_id)

    try:
        self.update_state(state="PROCESSING", meta={"step": "Converting PDF to Word..."})

        # Conversion is delegated to pdf_service.pdf_to_word
        output_path = pdf_to_word(input_path, output_dir)

        self.update_state(state="PROCESSING", meta={"step": "Uploading result..."})

        # Hand the converted file to the storage backend
        s3_key = storage.upload_file(output_path, task_id, folder="outputs")

        # Download name: original base name with a .docx extension
        name_without_ext = os.path.splitext(original_filename)[0]
        download_name = f"{name_without_ext}.docx"

        download_url = storage.generate_presigned_url(
            s3_key, original_filename=download_name
        )

        result = {
            "status": "completed",
            "download_url": download_url,
            "filename": download_name,
            "output_size": os.path.getsize(output_path),
        }

        logger.info("Task %s: PDF→Word conversion completed", task_id)
        # Tracking and file cleanup happen inside _finalize_task
        return _finalize_task(
            task_id,
            user_id,
            "pdf-to-word",
            original_filename,
            result,
            usage_source,
            api_key_id,
            self.request.id,
        )

    except PDFConversionError as e:
        # Expected domain error: its message is returned to the caller.
        logger.error("Task %s: Conversion error — %s", task_id, e)
        return _finalize_task(
            task_id,
            user_id,
            "pdf-to-word",
            original_filename,
            {"status": "failed", "error": str(e)},
            usage_source,
            api_key_id,
            self.request.id,
        )

    except Exception as e:
        # The caller only sees a generic message, so log the full traceback
        # here; otherwise the root cause is lost.
        logger.exception("Task %s: Unexpected error — %s", task_id, e)
        return _finalize_task(
            task_id,
            user_id,
            "pdf-to-word",
            original_filename,
            {"status": "failed", "error": "An unexpected error occurred."},
            usage_source,
            api_key_id,
            self.request.id,
        )
|
|
|
|
|
|
@celery.task(bind=True, name="app.tasks.convert_tasks.convert_word_to_pdf")
def convert_word_to_pdf(
    self,
    input_path: str,
    task_id: str,
    original_filename: str,
    user_id: int | None = None,
    usage_source: str = "web",
    api_key_id: int | None = None,
):
    """
    Async task: Convert Word document to PDF.

    Exceptions raised inside the conversion/upload steps are caught and
    reported as a ``"failed"`` result dict; every outcome is passed through
    ``_finalize_task`` before being returned.

    Args:
        input_path: Path to the uploaded Word file
        task_id: Unique task identifier
        original_filename: Original filename for download
        user_id: Forwarded to ``_finalize_task`` for task tracking
        usage_source: Forwarded to ``_finalize_task`` (defaults to "web")
        api_key_id: Forwarded to ``_finalize_task`` for task tracking

    Returns:
        On success, a dict with ``status`` ("completed"), ``download_url``,
        ``filename`` and ``output_size``. On failure, a dict with ``status``
        ("failed") and ``error``.
    """
    output_dir = _get_output_dir(task_id)

    try:
        self.update_state(state="PROCESSING", meta={"step": "Converting Word to PDF..."})

        # Conversion is delegated to pdf_service.word_to_pdf
        output_path = word_to_pdf(input_path, output_dir)

        self.update_state(state="PROCESSING", meta={"step": "Uploading result..."})

        # Hand the converted file to the storage backend
        s3_key = storage.upload_file(output_path, task_id, folder="outputs")

        # Download name: original base name with a .pdf extension
        name_without_ext = os.path.splitext(original_filename)[0]
        download_name = f"{name_without_ext}.pdf"

        download_url = storage.generate_presigned_url(
            s3_key, original_filename=download_name
        )

        result = {
            "status": "completed",
            "download_url": download_url,
            "filename": download_name,
            "output_size": os.path.getsize(output_path),
        }

        logger.info("Task %s: Word→PDF conversion completed", task_id)
        # Tracking and file cleanup happen inside _finalize_task
        return _finalize_task(
            task_id,
            user_id,
            "word-to-pdf",
            original_filename,
            result,
            usage_source,
            api_key_id,
            self.request.id,
        )

    except PDFConversionError as e:
        # Expected domain error: its message is returned to the caller.
        logger.error("Task %s: Conversion error — %s", task_id, e)
        return _finalize_task(
            task_id,
            user_id,
            "word-to-pdf",
            original_filename,
            {"status": "failed", "error": str(e)},
            usage_source,
            api_key_id,
            self.request.id,
        )

    except Exception as e:
        # The caller only sees a generic message, so log the full traceback
        # here; otherwise the root cause is lost.
        logger.exception("Task %s: Unexpected error — %s", task_id, e)
        return _finalize_task(
            task_id,
            user_id,
            "word-to-pdf",
            original_filename,
            {"status": "failed", "error": "An unexpected error occurred."},
            usage_source,
            api_key_id,
            self.request.id,
        )
|