|
import base64 |
|
import hashlib |
|
import hmac |
|
import logging |
|
import os |
|
import time |
|
from mimetypes import guess_extension, guess_type |
|
from typing import Optional, Union |
|
from uuid import uuid4 |
|
|
|
from httpx import get |
|
|
|
from configs import dify_config |
|
from extensions.ext_database import db |
|
from extensions.ext_storage import storage |
|
from models.model import MessageFile |
|
from models.tools import ToolFile |
|
|
|
logger = logging.getLogger(__name__) |
|
|
|
|
|
class ToolFileManager:
    """
    Create, sign, verify and load tool files.

    File bytes are written and read through ``storage``; the metadata of each
    file is kept in a ``ToolFile`` row handled through ``db.session``.
    All methods are static, so the class is used as a plain namespace.
    """

    @staticmethod
    def _compute_signature(file_id: str, timestamp: str, nonce: str) -> str:
        """
        build the signature that protects a file preview url

        :param file_id: the id of the tool file
        :param timestamp: unix timestamp (seconds) as a string
        :param nonce: random hex string generated when the url was signed

        :return: url-safe base64 encoded HMAC-SHA256 of the three values
        """
        # An unset SECRET_KEY falls back to an empty key, as the signing code always did.
        secret_key = dify_config.SECRET_KEY.encode() if dify_config.SECRET_KEY else b""
        data_to_sign = f"file-preview|{file_id}|{timestamp}|{nonce}"
        digest = hmac.new(secret_key, data_to_sign.encode(), hashlib.sha256).digest()
        return base64.urlsafe_b64encode(digest).decode()

    @staticmethod
    def _extract_tool_file_id(url: str) -> str:
        """
        extract the tool file id from a tool file url

        The id is the last path segment up to (not including) its first dot,
        e.g. ``.../files/tools/<id>.png?timestamp=...`` gives ``<id>``.

        :param url: the url stored on a message file

        :return: the tool file id
        """
        last_segment = url.split("/")[-1]
        return last_segment.split(".")[0]

    @staticmethod
    def _resolve_mimetype(file_url: str, content_type: str) -> str:
        """
        pick the mime type of a downloaded file

        :param file_url: the url the file was downloaded from
        :param content_type: the raw Content-Type header of the response ("" if absent)

        :return: the type guessed from the url, else the header value without
                 its parameters, else "application/octet-stream"
        """
        guessed = guess_type(file_url)[0]
        if guessed:
            return guessed
        # Drop parameters such as "; charset=utf-8" from the header value.
        from_header = content_type.split(";")[0].strip()
        return from_header or "application/octet-stream"

    @staticmethod
    def _store_file(
        *,
        user_id: str,
        tenant_id: str,
        conversation_id: Optional[str],
        file_binary: bytes,
        mimetype: str,
        original_url: Optional[str] = None,
    ) -> "ToolFile":
        """
        save the bytes to storage and persist the matching ToolFile row

        :param user_id: the id of the user the file belongs to
        :param tenant_id: the id of the tenant, used in the storage path
        :param conversation_id: the id of the conversation, may be None
        :param file_binary: the content of the file
        :param mimetype: the mime type of the file
        :param original_url: the url the file was downloaded from, if any

        :return: the committed and refreshed ToolFile
        """
        extension = guess_extension(mimetype) or ".bin"
        filename = f"{uuid4().hex}{extension}"
        filepath = f"tools/{tenant_id}/{filename}"
        storage.save(filepath, file_binary)

        fields = {
            "user_id": user_id,
            "tenant_id": tenant_id,
            "conversation_id": conversation_id,
            "file_key": filepath,
            "mimetype": mimetype,
            "name": filename,
            "size": len(file_binary),
        }
        # Only pass original_url when there is one, so files created from raw
        # bytes are constructed exactly as before.
        if original_url is not None:
            fields["original_url"] = original_url
        tool_file = ToolFile(**fields)

        db.session.add(tool_file)
        db.session.commit()
        db.session.refresh(tool_file)

        return tool_file

    @staticmethod
    def sign_file(tool_file_id: str, extension: str) -> str:
        """
        sign file to get a temporary url

        :param tool_file_id: the id of the tool file
        :param extension: the file extension appended to the id in the url

        :return: the preview url with timestamp, nonce and sign query parameters
        """
        base_url = dify_config.FILES_URL
        file_preview_url = f"{base_url}/files/tools/{tool_file_id}{extension}"

        timestamp = str(int(time.time()))
        nonce = os.urandom(16).hex()
        encoded_sign = ToolFileManager._compute_signature(tool_file_id, timestamp, nonce)

        return f"{file_preview_url}?timestamp={timestamp}&nonce={nonce}&sign={encoded_sign}"

    @staticmethod
    def verify_file(file_id: str, timestamp: str, nonce: str, sign: str) -> bool:
        """
        verify signature

        :param file_id: the id of the tool file
        :param timestamp: the timestamp query parameter of the signed url
        :param nonce: the nonce query parameter of the signed url
        :param sign: the sign query parameter of the signed url

        :return: True when the signature matches and the url is not older than
                 dify_config.FILES_ACCESS_TIMEOUT seconds, otherwise False
        """
        if not isinstance(sign, str):
            return False

        expected_sign = ToolFileManager._compute_signature(file_id, timestamp, nonce)

        # Constant-time comparison; bytes are compared because compare_digest
        # rejects non-ASCII str arguments.
        if not hmac.compare_digest(sign.encode(), expected_sign.encode()):
            return False

        try:
            issued_at = int(timestamp)
        except (TypeError, ValueError):
            return False

        current_time = int(time.time())
        return current_time - issued_at <= dify_config.FILES_ACCESS_TIMEOUT

    @staticmethod
    def create_file_by_raw(
        *,
        user_id: str,
        tenant_id: str,
        conversation_id: Optional[str],
        file_binary: bytes,
        mimetype: str,
    ) -> "ToolFile":
        """
        create a tool file from raw bytes

        :param user_id: the id of the user the file belongs to
        :param tenant_id: the id of the tenant, used in the storage path
        :param conversation_id: the id of the conversation, may be None
        :param file_binary: the content of the file
        :param mimetype: the mime type of the file

        :return: the stored ToolFile
        """
        return ToolFileManager._store_file(
            user_id=user_id,
            tenant_id=tenant_id,
            conversation_id=conversation_id,
            file_binary=file_binary,
            mimetype=mimetype,
        )

    @staticmethod
    def create_file_by_url(
        user_id: str,
        tenant_id: str,
        conversation_id: Optional[str],
        file_url: str,
    ) -> "ToolFile":
        """
        download a file and create a tool file from it

        :param user_id: the id of the user the file belongs to
        :param tenant_id: the id of the tenant, used in the storage path
        :param conversation_id: the id of the conversation, may be None
        :param file_url: the url to download the file from

        :return: the stored ToolFile, with original_url set to file_url
        :raises Exception: any error raised while downloading is logged and re-raised
        """
        try:
            response = get(file_url)
            response.raise_for_status()
            blob = response.content
        except Exception:
            # Log with traceback, then let the caller decide how to handle it.
            logger.exception("Failed to download file from %s", file_url)
            raise

        mimetype = ToolFileManager._resolve_mimetype(file_url, response.headers.get("Content-Type", ""))

        return ToolFileManager._store_file(
            user_id=user_id,
            tenant_id=tenant_id,
            conversation_id=conversation_id,
            file_binary=blob,
            mimetype=mimetype,
            original_url=file_url,
        )

    @staticmethod
    def get_file_binary(id: str) -> Optional[tuple[bytes, str]]:
        """
        get file binary

        :param id: the id of the file

        :return: the binary of the file, mime type; None when no tool file has this id
        """
        tool_file = db.session.query(ToolFile).filter(ToolFile.id == id).first()

        if not tool_file:
            return None

        blob = storage.load_once(tool_file.file_key)

        return blob, tool_file.mimetype

    @staticmethod
    def get_file_binary_by_message_file_id(id: str) -> Optional[tuple[bytes, str]]:
        """
        get file binary

        :param id: the id of the message file

        :return: the binary of the file, mime type; None when the message file,
                 its url or the referenced tool file is missing
        """
        message_file = db.session.query(MessageFile).filter(MessageFile.id == id).first()

        # Without a url there is no tool file id to look up, so skip the second query.
        if message_file is None or message_file.url is None:
            return None

        tool_file_id = ToolFileManager._extract_tool_file_id(message_file.url)

        return ToolFileManager.get_file_binary(tool_file_id)

    @staticmethod
    def get_file_generator_by_tool_file_id(tool_file_id: str):
        """
        get file stream

        :param tool_file_id: the id of the tool file

        :return: (stream, tool_file) where stream is the result of
                 storage.load_stream for the file; (None, None) when no tool
                 file has this id
        """
        tool_file = db.session.query(ToolFile).filter(ToolFile.id == tool_file_id).first()

        if not tool_file:
            return None, None

        stream = storage.load_stream(tool_file.file_key)

        return stream, tool_file
|
|
|
|
|
|
|
# Register ToolFileManager under the "manager" key of the shared
# tool_file_manager mapping from core.file.tool_file_parser.
# NOTE(review): the import sits at the bottom of the module, presumably to
# avoid a circular import with core.file.tool_file_parser - confirm.
from core.file.tool_file_parser import tool_file_manager

tool_file_manager["manager"] = ToolFileManager
|
|