import logging from pathlib import Path from typing import Sequence import boto3 from boto3 import Session from botocore.exceptions import ClientError from django.conf import settings from pyblackbird_cc.resources.utils import _get_pdf_collection_type logger = logging.getLogger(__name__) def get_presigned_obj_url(bucket_name, obj_name, expiration=3600) -> str | None: client = boto3.client( "s3", endpoint_url=settings.AWS_S3_ENDPOINT_URL, aws_access_key_id=settings.AWS_ACCESS_KEY_ID, aws_secret_access_key=settings.AWS_SECRET_ACCESS_KEY, region_name=settings.AWS_S3_REGION_NAME, ) logger.info("Client created", extra={"client": client}) try: response = client.generate_presigned_url( "get_object", Params={"Bucket": bucket_name, "Key": obj_name}, ExpiresIn=expiration, ) except ClientError as e: logger.exception("Error generating presigned URL", extra={"error": e}) return None return response def get_s3_client() -> Session.client: return boto3.Session().client( "s3", endpoint_url=settings.AWS_S3_ENDPOINT_URL, aws_access_key_id=settings.AWS_ACCESS_KEY_ID, aws_secret_access_key=settings.AWS_SECRET_ACCESS_KEY, region_name=settings.AWS_S3_REGION_NAME ) def upload_files_to_s3(files: Sequence, dir_name: str) -> None: """ Generic upload function. Pass "thumbnails" or "pdfuploads" as dir_name to dictate the type of file to upload. :param files: :param dir_name: :return: """ s3_client = get_s3_client() for file in files: logging.info(f"Uploading {file.name} to S3") s3_client.upload_fileobj( file, settings.AWS_STORAGE_BUCKET_NAME, f"{dir_name}/{file.name}" ) def upload_snapshotted_pages_to_s3(snapshotted_pages): s3_client = get_s3_client() collection_type = _get_pdf_collection_type(snapshotted_pages) if collection_type in ["SINGLE_PDF_SINGLE_PAGE", "SINGLE_PDF_MULTI_PAGE"]: for img in snapshotted_pages[0]: logging.info(f"Uploading {img} to S3") s3_client.upload_file( img, settings.AWS_STORAGE_BUCKET_NAME, f"snapshotted_pages/{Path(img).name}" ) return True if collection_type in ["MULTI_PDF_SINGLE_PAGE", "MULTI_PDF_MULTI_PAGE"]: for pdf in snapshotted_pages: for img in pdf: logging.info(f"Uploading {img} to S3") s3_client.upload_file( img, settings.AWS_STORAGE_BUCKET_NAME, f"snapshotted_pages/{Path(img).name}" ) return True return False def upload_to_s3(pdf_files, thumbnail_files, snapshotted_pages) -> bool: """ :param pdf_files: a list of PDF files :param thumbnail_files: a list of thumbnail files :param snapshotted_pages: a list of snapshotted pages :return: True if the files was uploaded, False otherwise """ try: upload_files_to_s3(pdf_files, dir_name='pdfuploads') upload_files_to_s3(thumbnail_files, dir_name='thumbnails') return upload_snapshotted_pages_to_s3(snapshotted_pages) except ClientError: logging.exception("Error uploading files to S3") return False