Spaces:
Paused
Paused
| import base64 | |
| import hashlib | |
| import hmac | |
| import logging | |
| import os | |
| import time | |
| from mimetypes import guess_extension, guess_type | |
| from typing import Optional, Union | |
| from uuid import uuid4 | |
| from httpx import get | |
| from configs import dify_config | |
| from extensions.ext_database import db | |
| from extensions.ext_storage import storage | |
| from models.model import MessageFile | |
| from models.tools import ToolFile | |
| logger = logging.getLogger(__name__) | |
| class ToolFileManager: | |
| def sign_file(tool_file_id: str, extension: str) -> str: | |
| """ | |
| sign file to get a temporary url | |
| """ | |
| base_url = dify_config.FILES_URL | |
| file_preview_url = f"{base_url}/files/tools/{tool_file_id}{extension}" | |
| timestamp = str(int(time.time())) | |
| nonce = os.urandom(16).hex() | |
| data_to_sign = f"file-preview|{tool_file_id}|{timestamp}|{nonce}" | |
| secret_key = dify_config.SECRET_KEY.encode() if dify_config.SECRET_KEY else b"" | |
| sign = hmac.new(secret_key, data_to_sign.encode(), hashlib.sha256).digest() | |
| encoded_sign = base64.urlsafe_b64encode(sign).decode() | |
| return f"{file_preview_url}?timestamp={timestamp}&nonce={nonce}&sign={encoded_sign}" | |
| def verify_file(file_id: str, timestamp: str, nonce: str, sign: str) -> bool: | |
| """ | |
| verify signature | |
| """ | |
| data_to_sign = f"file-preview|{file_id}|{timestamp}|{nonce}" | |
| secret_key = dify_config.SECRET_KEY.encode() if dify_config.SECRET_KEY else b"" | |
| recalculated_sign = hmac.new(secret_key, data_to_sign.encode(), hashlib.sha256).digest() | |
| recalculated_encoded_sign = base64.urlsafe_b64encode(recalculated_sign).decode() | |
| # verify signature | |
| if sign != recalculated_encoded_sign: | |
| return False | |
| current_time = int(time.time()) | |
| return current_time - int(timestamp) <= dify_config.FILES_ACCESS_TIMEOUT | |
| def create_file_by_raw( | |
| *, | |
| user_id: str, | |
| tenant_id: str, | |
| conversation_id: Optional[str], | |
| file_binary: bytes, | |
| mimetype: str, | |
| ) -> ToolFile: | |
| extension = guess_extension(mimetype) or ".bin" | |
| unique_name = uuid4().hex | |
| filename = f"{unique_name}{extension}" | |
| filepath = f"tools/{tenant_id}/{filename}" | |
| storage.save(filepath, file_binary) | |
| tool_file = ToolFile( | |
| user_id=user_id, | |
| tenant_id=tenant_id, | |
| conversation_id=conversation_id, | |
| file_key=filepath, | |
| mimetype=mimetype, | |
| name=filename, | |
| size=len(file_binary), | |
| ) | |
| db.session.add(tool_file) | |
| db.session.commit() | |
| db.session.refresh(tool_file) | |
| return tool_file | |
| def create_file_by_url( | |
| user_id: str, | |
| tenant_id: str, | |
| conversation_id: str | None, | |
| file_url: str, | |
| ) -> ToolFile: | |
| # try to download image | |
| try: | |
| response = get(file_url) | |
| response.raise_for_status() | |
| blob = response.content | |
| except Exception as e: | |
| logger.error(f"Failed to download file from {file_url}: {e}") | |
| raise | |
| mimetype = guess_type(file_url)[0] or "octet/stream" | |
| extension = guess_extension(mimetype) or ".bin" | |
| unique_name = uuid4().hex | |
| filename = f"{unique_name}{extension}" | |
| filepath = f"tools/{tenant_id}/{filename}" | |
| storage.save(filepath, blob) | |
| tool_file = ToolFile( | |
| user_id=user_id, | |
| tenant_id=tenant_id, | |
| conversation_id=conversation_id, | |
| file_key=filepath, | |
| mimetype=mimetype, | |
| original_url=file_url, | |
| name=filename, | |
| size=len(blob), | |
| ) | |
| db.session.add(tool_file) | |
| db.session.commit() | |
| return tool_file | |
| def get_file_binary(id: str) -> Union[tuple[bytes, str], None]: | |
| """ | |
| get file binary | |
| :param id: the id of the file | |
| :return: the binary of the file, mime type | |
| """ | |
| tool_file = ( | |
| db.session.query(ToolFile) | |
| .filter( | |
| ToolFile.id == id, | |
| ) | |
| .first() | |
| ) | |
| if not tool_file: | |
| return None | |
| blob = storage.load_once(tool_file.file_key) | |
| return blob, tool_file.mimetype | |
| def get_file_binary_by_message_file_id(id: str) -> Union[tuple[bytes, str], None]: | |
| """ | |
| get file binary | |
| :param id: the id of the file | |
| :return: the binary of the file, mime type | |
| """ | |
| message_file = ( | |
| db.session.query(MessageFile) | |
| .filter( | |
| MessageFile.id == id, | |
| ) | |
| .first() | |
| ) | |
| # Check if message_file is not None | |
| if message_file is not None: | |
| # get tool file id | |
| if message_file.url is not None: | |
| tool_file_id = message_file.url.split("/")[-1] | |
| # trim extension | |
| tool_file_id = tool_file_id.split(".")[0] | |
| else: | |
| tool_file_id = None | |
| else: | |
| tool_file_id = None | |
| tool_file = ( | |
| db.session.query(ToolFile) | |
| .filter( | |
| ToolFile.id == tool_file_id, | |
| ) | |
| .first() | |
| ) | |
| if not tool_file: | |
| return None | |
| blob = storage.load_once(tool_file.file_key) | |
| return blob, tool_file.mimetype | |
| def get_file_generator_by_tool_file_id(tool_file_id: str): | |
| """ | |
| get file binary | |
| :param tool_file_id: the id of the tool file | |
| :return: the binary of the file, mime type | |
| """ | |
| tool_file = ( | |
| db.session.query(ToolFile) | |
| .filter( | |
| ToolFile.id == tool_file_id, | |
| ) | |
| .first() | |
| ) | |
| if not tool_file: | |
| return None, None | |
| stream = storage.load_stream(tool_file.file_key) | |
| return stream, tool_file | |
| # init tool_file_parser | |
| from core.file.tool_file_parser import tool_file_manager | |
| tool_file_manager["manager"] = ToolFileManager | |