feat/datasource
parent
389f15f8e3
commit
d4007ae073
@ -1,234 +0,0 @@
|
|||||||
import base64
|
|
||||||
import hashlib
|
|
||||||
import hmac
|
|
||||||
import logging
|
|
||||||
import os
|
|
||||||
import time
|
|
||||||
from mimetypes import guess_extension, guess_type
|
|
||||||
from typing import Optional, Union
|
|
||||||
from uuid import uuid4
|
|
||||||
|
|
||||||
import httpx
|
|
||||||
|
|
||||||
from configs import dify_config
|
|
||||||
from core.helper import ssrf_proxy
|
|
||||||
from extensions.ext_database import db
|
|
||||||
from extensions.ext_storage import storage
|
|
||||||
from models.model import MessageFile
|
|
||||||
from models.tools import ToolFile
|
|
||||||
|
|
||||||
logger = logging.getLogger(__name__)
|
|
||||||
|
|
||||||
|
|
||||||
class ToolFileManager:
|
|
||||||
@staticmethod
|
|
||||||
def sign_file(tool_file_id: str, extension: str) -> str:
|
|
||||||
"""
|
|
||||||
sign file to get a temporary url
|
|
||||||
"""
|
|
||||||
base_url = dify_config.FILES_URL
|
|
||||||
file_preview_url = f"{base_url}/files/tools/{tool_file_id}{extension}"
|
|
||||||
|
|
||||||
timestamp = str(int(time.time()))
|
|
||||||
nonce = os.urandom(16).hex()
|
|
||||||
data_to_sign = f"file-preview|{tool_file_id}|{timestamp}|{nonce}"
|
|
||||||
secret_key = dify_config.SECRET_KEY.encode() if dify_config.SECRET_KEY else b""
|
|
||||||
sign = hmac.new(secret_key, data_to_sign.encode(), hashlib.sha256).digest()
|
|
||||||
encoded_sign = base64.urlsafe_b64encode(sign).decode()
|
|
||||||
|
|
||||||
return f"{file_preview_url}?timestamp={timestamp}&nonce={nonce}&sign={encoded_sign}"
|
|
||||||
|
|
||||||
@staticmethod
|
|
||||||
def verify_file(file_id: str, timestamp: str, nonce: str, sign: str) -> bool:
|
|
||||||
"""
|
|
||||||
verify signature
|
|
||||||
"""
|
|
||||||
data_to_sign = f"file-preview|{file_id}|{timestamp}|{nonce}"
|
|
||||||
secret_key = dify_config.SECRET_KEY.encode() if dify_config.SECRET_KEY else b""
|
|
||||||
recalculated_sign = hmac.new(secret_key, data_to_sign.encode(), hashlib.sha256).digest()
|
|
||||||
recalculated_encoded_sign = base64.urlsafe_b64encode(recalculated_sign).decode()
|
|
||||||
|
|
||||||
# verify signature
|
|
||||||
if sign != recalculated_encoded_sign:
|
|
||||||
return False
|
|
||||||
|
|
||||||
current_time = int(time.time())
|
|
||||||
return current_time - int(timestamp) <= dify_config.FILES_ACCESS_TIMEOUT
|
|
||||||
|
|
||||||
@staticmethod
|
|
||||||
def create_file_by_raw(
|
|
||||||
*,
|
|
||||||
user_id: str,
|
|
||||||
tenant_id: str,
|
|
||||||
conversation_id: Optional[str],
|
|
||||||
file_binary: bytes,
|
|
||||||
mimetype: str,
|
|
||||||
filename: Optional[str] = None,
|
|
||||||
) -> ToolFile:
|
|
||||||
extension = guess_extension(mimetype) or ".bin"
|
|
||||||
unique_name = uuid4().hex
|
|
||||||
unique_filename = f"{unique_name}{extension}"
|
|
||||||
# default just as before
|
|
||||||
present_filename = unique_filename
|
|
||||||
if filename is not None:
|
|
||||||
has_extension = len(filename.split(".")) > 1
|
|
||||||
# Add extension flexibly
|
|
||||||
present_filename = filename if has_extension else f"{filename}{extension}"
|
|
||||||
filepath = f"tools/{tenant_id}/{unique_filename}"
|
|
||||||
storage.save(filepath, file_binary)
|
|
||||||
|
|
||||||
tool_file = ToolFile(
|
|
||||||
user_id=user_id,
|
|
||||||
tenant_id=tenant_id,
|
|
||||||
conversation_id=conversation_id,
|
|
||||||
file_key=filepath,
|
|
||||||
mimetype=mimetype,
|
|
||||||
name=present_filename,
|
|
||||||
size=len(file_binary),
|
|
||||||
)
|
|
||||||
|
|
||||||
db.session.add(tool_file)
|
|
||||||
db.session.commit()
|
|
||||||
db.session.refresh(tool_file)
|
|
||||||
|
|
||||||
return tool_file
|
|
||||||
|
|
||||||
@staticmethod
|
|
||||||
def create_file_by_url(
|
|
||||||
user_id: str,
|
|
||||||
tenant_id: str,
|
|
||||||
file_url: str,
|
|
||||||
conversation_id: Optional[str] = None,
|
|
||||||
) -> ToolFile:
|
|
||||||
# try to download image
|
|
||||||
try:
|
|
||||||
response = ssrf_proxy.get(file_url)
|
|
||||||
response.raise_for_status()
|
|
||||||
blob = response.content
|
|
||||||
except httpx.TimeoutException:
|
|
||||||
raise ValueError(f"timeout when downloading file from {file_url}")
|
|
||||||
|
|
||||||
mimetype = (
|
|
||||||
guess_type(file_url)[0]
|
|
||||||
or response.headers.get("Content-Type", "").split(";")[0].strip()
|
|
||||||
or "application/octet-stream"
|
|
||||||
)
|
|
||||||
extension = guess_extension(mimetype) or ".bin"
|
|
||||||
unique_name = uuid4().hex
|
|
||||||
filename = f"{unique_name}{extension}"
|
|
||||||
filepath = f"tools/{tenant_id}/{filename}"
|
|
||||||
storage.save(filepath, blob)
|
|
||||||
|
|
||||||
tool_file = ToolFile(
|
|
||||||
user_id=user_id,
|
|
||||||
tenant_id=tenant_id,
|
|
||||||
conversation_id=conversation_id,
|
|
||||||
file_key=filepath,
|
|
||||||
mimetype=mimetype,
|
|
||||||
original_url=file_url,
|
|
||||||
name=filename,
|
|
||||||
size=len(blob),
|
|
||||||
)
|
|
||||||
|
|
||||||
db.session.add(tool_file)
|
|
||||||
db.session.commit()
|
|
||||||
|
|
||||||
return tool_file
|
|
||||||
|
|
||||||
@staticmethod
|
|
||||||
def get_file_binary(id: str) -> Union[tuple[bytes, str], None]:
|
|
||||||
"""
|
|
||||||
get file binary
|
|
||||||
|
|
||||||
:param id: the id of the file
|
|
||||||
|
|
||||||
:return: the binary of the file, mime type
|
|
||||||
"""
|
|
||||||
tool_file: ToolFile | None = (
|
|
||||||
db.session.query(ToolFile)
|
|
||||||
.filter(
|
|
||||||
ToolFile.id == id,
|
|
||||||
)
|
|
||||||
.first()
|
|
||||||
)
|
|
||||||
|
|
||||||
if not tool_file:
|
|
||||||
return None
|
|
||||||
|
|
||||||
blob = storage.load_once(tool_file.file_key)
|
|
||||||
|
|
||||||
return blob, tool_file.mimetype
|
|
||||||
|
|
||||||
@staticmethod
|
|
||||||
def get_file_binary_by_message_file_id(id: str) -> Union[tuple[bytes, str], None]:
|
|
||||||
"""
|
|
||||||
get file binary
|
|
||||||
|
|
||||||
:param id: the id of the file
|
|
||||||
|
|
||||||
:return: the binary of the file, mime type
|
|
||||||
"""
|
|
||||||
message_file: MessageFile | None = (
|
|
||||||
db.session.query(MessageFile)
|
|
||||||
.filter(
|
|
||||||
MessageFile.id == id,
|
|
||||||
)
|
|
||||||
.first()
|
|
||||||
)
|
|
||||||
|
|
||||||
# Check if message_file is not None
|
|
||||||
if message_file is not None:
|
|
||||||
# get tool file id
|
|
||||||
if message_file.url is not None:
|
|
||||||
tool_file_id = message_file.url.split("/")[-1]
|
|
||||||
# trim extension
|
|
||||||
tool_file_id = tool_file_id.split(".")[0]
|
|
||||||
else:
|
|
||||||
tool_file_id = None
|
|
||||||
else:
|
|
||||||
tool_file_id = None
|
|
||||||
|
|
||||||
tool_file: ToolFile | None = (
|
|
||||||
db.session.query(ToolFile)
|
|
||||||
.filter(
|
|
||||||
ToolFile.id == tool_file_id,
|
|
||||||
)
|
|
||||||
.first()
|
|
||||||
)
|
|
||||||
|
|
||||||
if not tool_file:
|
|
||||||
return None
|
|
||||||
|
|
||||||
blob = storage.load_once(tool_file.file_key)
|
|
||||||
|
|
||||||
return blob, tool_file.mimetype
|
|
||||||
|
|
||||||
@staticmethod
|
|
||||||
def get_file_generator_by_tool_file_id(tool_file_id: str):
|
|
||||||
"""
|
|
||||||
get file binary
|
|
||||||
|
|
||||||
:param tool_file_id: the id of the tool file
|
|
||||||
|
|
||||||
:return: the binary of the file, mime type
|
|
||||||
"""
|
|
||||||
tool_file: ToolFile | None = (
|
|
||||||
db.session.query(ToolFile)
|
|
||||||
.filter(
|
|
||||||
ToolFile.id == tool_file_id,
|
|
||||||
)
|
|
||||||
.first()
|
|
||||||
)
|
|
||||||
|
|
||||||
if not tool_file:
|
|
||||||
return None, None
|
|
||||||
|
|
||||||
stream = storage.load_stream(tool_file.file_key)
|
|
||||||
|
|
||||||
return stream, tool_file
|
|
||||||
|
|
||||||
|
|
||||||
# init tool_file_parser
|
|
||||||
from core.file.tool_file_parser import tool_file_manager
|
|
||||||
|
|
||||||
tool_file_manager["manager"] = ToolFileManager
|
|
||||||
@ -1,101 +0,0 @@
|
|||||||
from core.tools.__base.tool_provider import ToolProviderController
|
|
||||||
from core.tools.builtin_tool.provider import BuiltinToolProviderController
|
|
||||||
from core.tools.custom_tool.provider import ApiToolProviderController
|
|
||||||
from core.tools.entities.values import default_tool_label_name_list
|
|
||||||
from core.tools.workflow_as_tool.provider import WorkflowToolProviderController
|
|
||||||
from extensions.ext_database import db
|
|
||||||
from models.tools import ToolLabelBinding
|
|
||||||
|
|
||||||
|
|
||||||
class ToolLabelManager:
|
|
||||||
@classmethod
|
|
||||||
def filter_tool_labels(cls, tool_labels: list[str]) -> list[str]:
|
|
||||||
"""
|
|
||||||
Filter tool labels
|
|
||||||
"""
|
|
||||||
tool_labels = [label for label in tool_labels if label in default_tool_label_name_list]
|
|
||||||
return list(set(tool_labels))
|
|
||||||
|
|
||||||
@classmethod
|
|
||||||
def update_tool_labels(cls, controller: ToolProviderController, labels: list[str]):
|
|
||||||
"""
|
|
||||||
Update tool labels
|
|
||||||
"""
|
|
||||||
labels = cls.filter_tool_labels(labels)
|
|
||||||
|
|
||||||
if isinstance(controller, ApiToolProviderController | WorkflowToolProviderController):
|
|
||||||
provider_id = controller.provider_id
|
|
||||||
else:
|
|
||||||
raise ValueError("Unsupported tool type")
|
|
||||||
|
|
||||||
# delete old labels
|
|
||||||
db.session.query(ToolLabelBinding).filter(ToolLabelBinding.tool_id == provider_id).delete()
|
|
||||||
|
|
||||||
# insert new labels
|
|
||||||
for label in labels:
|
|
||||||
db.session.add(
|
|
||||||
ToolLabelBinding(
|
|
||||||
tool_id=provider_id,
|
|
||||||
tool_type=controller.provider_type.value,
|
|
||||||
label_name=label,
|
|
||||||
)
|
|
||||||
)
|
|
||||||
|
|
||||||
db.session.commit()
|
|
||||||
|
|
||||||
@classmethod
|
|
||||||
def get_tool_labels(cls, controller: ToolProviderController) -> list[str]:
|
|
||||||
"""
|
|
||||||
Get tool labels
|
|
||||||
"""
|
|
||||||
if isinstance(controller, ApiToolProviderController | WorkflowToolProviderController):
|
|
||||||
provider_id = controller.provider_id
|
|
||||||
elif isinstance(controller, BuiltinToolProviderController):
|
|
||||||
return controller.tool_labels
|
|
||||||
else:
|
|
||||||
raise ValueError("Unsupported tool type")
|
|
||||||
|
|
||||||
labels = (
|
|
||||||
db.session.query(ToolLabelBinding.label_name)
|
|
||||||
.filter(
|
|
||||||
ToolLabelBinding.tool_id == provider_id,
|
|
||||||
ToolLabelBinding.tool_type == controller.provider_type.value,
|
|
||||||
)
|
|
||||||
.all()
|
|
||||||
)
|
|
||||||
|
|
||||||
return [label.label_name for label in labels]
|
|
||||||
|
|
||||||
@classmethod
|
|
||||||
def get_tools_labels(cls, tool_providers: list[ToolProviderController]) -> dict[str, list[str]]:
|
|
||||||
"""
|
|
||||||
Get tools labels
|
|
||||||
|
|
||||||
:param tool_providers: list of tool providers
|
|
||||||
|
|
||||||
:return: dict of tool labels
|
|
||||||
:key: tool id
|
|
||||||
:value: list of tool labels
|
|
||||||
"""
|
|
||||||
if not tool_providers:
|
|
||||||
return {}
|
|
||||||
|
|
||||||
for controller in tool_providers:
|
|
||||||
if not isinstance(controller, ApiToolProviderController | WorkflowToolProviderController):
|
|
||||||
raise ValueError("Unsupported tool type")
|
|
||||||
|
|
||||||
provider_ids = []
|
|
||||||
for controller in tool_providers:
|
|
||||||
assert isinstance(controller, ApiToolProviderController | WorkflowToolProviderController)
|
|
||||||
provider_ids.append(controller.provider_id)
|
|
||||||
|
|
||||||
labels: list[ToolLabelBinding] = (
|
|
||||||
db.session.query(ToolLabelBinding).filter(ToolLabelBinding.tool_id.in_(provider_ids)).all()
|
|
||||||
)
|
|
||||||
|
|
||||||
tool_labels: dict[str, list[str]] = {label.tool_id: [] for label in labels}
|
|
||||||
|
|
||||||
for label in labels:
|
|
||||||
tool_labels[label.tool_id].append(label.label_name)
|
|
||||||
|
|
||||||
return tool_labels
|
|
||||||
Loading…
Reference in New Issue