support bedrock kb: retrieve and generate (#13027)

1 year ago · b2bbc28580
parent 59b3e672aa
commit b2bbc28580
5 changed files with 813 additions and 18 deletions
--- a/api/core/tools/provider/builtin/aws/tools/bedrock_config.py
+++ b/api/core/tools/provider/builtin/aws/tools/bedrock_config.py
@ -0,0 +1,114 @@
 """
 Configuration classes for AWS Bedrock retrieve and generate API
 """
 from dataclasses import dataclass
 from typing import Any, Literal, Optional
@dataclass
 class TextInferenceConfig:
    """Optional sampling settings for text generation.

    Field names are camelCase and match the keys the retrieve-and-generate
    tool places under ``textInferenceConfig``. Every field defaults to None.
    """
    # Maximum number of tokens to generate.
    maxTokens: Optional[int] = None
    # Strings that stop generation when encountered.
    stopSequences: Optional[list[str]] = None
    # Randomness control; the tool's parameter schema restricts it to 0-1.
    temperature: Optional[float] = None
    # Nucleus-sampling control; the tool's parameter schema restricts it to 0-1.
    topP: Optional[float] = None
@dataclass
 class PerformanceConfig:
    """Performance (latency) settings for a model call."""
    # Required; only the two literal values below are allowed by the annotation.
    latency: Literal["standard", "optimized"]
@dataclass
 class PromptTemplate:
    """Wrapper around a custom text prompt template."""
    # Required template text; the tool sends it under the "textPromptTemplate" key.
    textPromptTemplate: str
@dataclass
 class GuardrailConfig:
    """Identifies the guardrail to apply; both fields are required."""
    # ID of the guardrail to apply.
    guardrailId: str
    # Version of the guardrail to apply.
    guardrailVersion: str
@dataclass
 class GenerationConfig:
    """Settings for the response-generation step; every field is optional."""
    # Free-form extra fields for the model request.
    additionalModelRequestFields: Optional[dict[str, Any]] = None
    # Guardrail to apply, if any.
    guardrailConfiguration: Optional[GuardrailConfig] = None
    # Mapping to inference settings; the tool uses the single key "textInferenceConfig".
    inferenceConfig: Optional[dict[str, TextInferenceConfig]] = None
    # Latency mode.
    performanceConfig: Optional[PerformanceConfig] = None
    # Custom prompt template for generation.
    promptTemplate: Optional[PromptTemplate] = None
@dataclass
 class VectorSearchConfig:
    """Settings for the vector search over the knowledge base; all optional."""
    # Metadata filter conditions (free-form dictionary).
    filter: Optional[dict[str, Any]] = None
    # Number of results to retrieve.
    numberOfResults: Optional[int] = None
    # Search type override; restricted by the annotation to HYBRID or SEMANTIC.
    overrideSearchType: Optional[Literal["HYBRID", "SEMANTIC"]] = None
@dataclass
 class RetrievalConfig:
    """Retrieval settings; wraps the required vector search configuration."""
    # Required vector search settings.
    vectorSearchConfiguration: VectorSearchConfig
@dataclass
 class OrchestrationConfig:
    """Settings for the orchestration step; every field is optional.

    Has the same fields as GenerationConfig except that there is no
    guardrail configuration.
    """
    # Free-form extra fields for the orchestration model request.
    additionalModelRequestFields: Optional[dict[str, Any]] = None
    # Mapping to inference settings; the tool uses the single key "textInferenceConfig".
    inferenceConfig: Optional[dict[str, TextInferenceConfig]] = None
    # Latency mode for orchestration.
    performanceConfig: Optional[PerformanceConfig] = None
    # Custom prompt template for orchestration.
    promptTemplate: Optional[PromptTemplate] = None
@dataclass
 class KnowledgeBaseConfig:
    """Knowledge base settings for a retrieve-and-generate request.

    The first three fields are required and, being positional, must be
    supplied in the declared order when not passed by keyword.
    """
    # Required generation settings.
    generationConfiguration: GenerationConfig
    # Required ID of the Bedrock knowledge base.
    knowledgeBaseId: str
    # Required ARN of the model to use.
    modelArn: str
    # Optional orchestration settings.
    orchestrationConfiguration: Optional[OrchestrationConfig] = None
    # Optional retrieval settings.
    retrievalConfiguration: Optional[RetrievalConfig] = None
@dataclass
 class SessionConfig:
    """Session settings; both fields are optional."""
    # ARN of a KMS key for the session.
    kmsKeyArn: Optional[str] = None
    # NOTE(review): the Bedrock request appears to take sessionId at the top
    # level rather than inside the session configuration — confirm against
    # the API reference before relying on this field.
    sessionId: Optional[str] = None
@dataclass
 class RetrieveAndGenerateConfiguration:
    """Selects the source type for a retrieve-and-generate request.

    Only the knowledge-base variant is modelled here: there is no field for
    an external-sources configuration in this class.
    """
    # Source type; defaults to the knowledge-base variant.
    type: str = "KNOWLEDGE_BASE"
    # Knowledge base settings; optional in this declaration.
    knowledgeBaseConfiguration: Optional[KnowledgeBaseConfig] = None
@dataclass
 class RetrieveAndGenerateConfig:
    """Top-level shape of a retrieve-and-generate request."""
    # Required query payload; the tool sends it as {"text": <query>}.
    input: dict[str, str]
    # Required source configuration.
    retrieveAndGenerateConfiguration: RetrieveAndGenerateConfiguration
    # Optional session settings.
    sessionConfiguration: Optional[SessionConfig] = None
    # Optional session ID for continuing a conversation.
    sessionId: Optional[str] = None
--- a/api/core/tools/provider/builtin/aws/tools/bedrock_retrieve_and_generate.py
+++ b/api/core/tools/provider/builtin/aws/tools/bedrock_retrieve_and_generate.py
@ -0,0 +1,324 @@
 import json
 from typing import Any, Optional
 import boto3
 from core.tools.entities.tool_entities import ToolInvokeMessage
 from core.tools.tool.builtin_tool import BuiltinTool
 class BedrockRetrieveAndGenerateTool(BuiltinTool):
    bedrock_client: Any = None
    def _create_text_inference_config(
        self,
        max_tokens: Optional[int] = None,
        stop_sequences: Optional[str] = None,
        temperature: Optional[float] = None,
        top_p: Optional[float] = None,
    ) -> Optional[dict]:
        """Create text inference configuration"""
        if any([max_tokens, stop_sequences, temperature, top_p]):
            config = {}
            if max_tokens is not None:
                config["maxTokens"] = max_tokens
            if stop_sequences:
                try:
                    config["stopSequences"] = json.loads(stop_sequences)
                except json.JSONDecodeError:
                    config["stopSequences"] = []
            if temperature is not None:
                config["temperature"] = temperature
            if top_p is not None:
                config["topP"] = top_p
            return config
        return None
    def _create_guardrail_config(
        self,
        guardrail_id: Optional[str] = None,
        guardrail_version: Optional[str] = None,
    ) -> Optional[dict]:
        """Create guardrail configuration"""
        if guardrail_id and guardrail_version:
            return {"guardrailId": guardrail_id, "guardrailVersion": guardrail_version}
        return None
    def _create_generation_config(
        self,
        additional_model_fields: Optional[str] = None,
        guardrail_config: Optional[dict] = None,
        text_inference_config: Optional[dict] = None,
        performance_mode: Optional[str] = None,
        prompt_template: Optional[str] = None,
    ) -> dict:
        """Create generation configuration"""
        config = {}
        if additional_model_fields:
            try:
                config["additionalModelRequestFields"] = json.loads(additional_model_fields)
            except json.JSONDecodeError:
                pass
        if guardrail_config:
            config["guardrailConfiguration"] = guardrail_config
        if text_inference_config:
            config["inferenceConfig"] = {"textInferenceConfig": text_inference_config}
        if performance_mode:
            config["performanceConfig"] = {"latency": performance_mode}
        if prompt_template:
            config["promptTemplate"] = {"textPromptTemplate": prompt_template}
        return config
    def _create_orchestration_config(
        self,
        orchestration_additional_model_fields: Optional[str] = None,
        orchestration_text_inference_config: Optional[dict] = None,
        orchestration_performance_mode: Optional[str] = None,
        orchestration_prompt_template: Optional[str] = None,
    ) -> dict:
        """Create orchestration configuration"""
        config = {}
        if orchestration_additional_model_fields:
            try:
                config["additionalModelRequestFields"] = json.loads(orchestration_additional_model_fields)
            except json.JSONDecodeError:
                pass
        if orchestration_text_inference_config:
            config["inferenceConfig"] = {"textInferenceConfig": orchestration_text_inference_config}
        if orchestration_performance_mode:
            config["performanceConfig"] = {"latency": orchestration_performance_mode}
        if orchestration_prompt_template:
            config["promptTemplate"] = {"textPromptTemplate": orchestration_prompt_template}
        return config
    def _create_vector_search_config(
        self,
        number_of_results: int = 5,
        search_type: str = "SEMANTIC",
        metadata_filter: Optional[dict] = None,
    ) -> dict:
        """Create vector search configuration"""
        config = {
            "numberOfResults": number_of_results,
            "overrideSearchType": search_type,
        }
        # Only add filter if metadata_filter is not empty
        if metadata_filter:
            config["filter"] = metadata_filter
        return config
    def _bedrock_retrieve_and_generate(
        self,
        query: str,
        knowledge_base_id: str,
        model_arn: str,
        # Generation Configuration
        additional_model_fields: Optional[str] = None,
        guardrail_id: Optional[str] = None,
        guardrail_version: Optional[str] = None,
        max_tokens: Optional[int] = None,
        stop_sequences: Optional[str] = None,
        temperature: Optional[float] = None,
        top_p: Optional[float] = None,
        performance_mode: str = "standard",
        prompt_template: Optional[str] = None,
        # Orchestration Configuration
        orchestration_additional_model_fields: Optional[str] = None,
        orchestration_max_tokens: Optional[int] = None,
        orchestration_stop_sequences: Optional[str] = None,
        orchestration_temperature: Optional[float] = None,
        orchestration_top_p: Optional[float] = None,
        orchestration_performance_mode: Optional[str] = None,
        orchestration_prompt_template: Optional[str] = None,
        # Retrieval Configuration
        number_of_results: int = 5,
        search_type: str = "SEMANTIC",
        metadata_filter: Optional[dict] = None,
        # Additional Configuration
        session_id: Optional[str] = None,
    ) -> dict[str, Any]:
        try:
            # Create text inference configurations
            text_inference_config = self._create_text_inference_config(max_tokens, stop_sequences, temperature, top_p)
            orchestration_text_inference_config = self._create_text_inference_config(
                orchestration_max_tokens, orchestration_stop_sequences, orchestration_temperature, orchestration_top_p
            )
            # Create guardrail configuration
            guardrail_config = self._create_guardrail_config(guardrail_id, guardrail_version)
            # Create vector search configuration
            vector_search_config = self._create_vector_search_config(number_of_results, search_type, metadata_filter)
            # Create generation configuration
            generation_config = self._create_generation_config(
                additional_model_fields, guardrail_config, text_inference_config, performance_mode, prompt_template
            )
            # Create orchestration configuration
            orchestration_config = self._create_orchestration_config(
                orchestration_additional_model_fields,
                orchestration_text_inference_config,
                orchestration_performance_mode,
                orchestration_prompt_template,
            )
            # Create knowledge base configuration
            knowledge_base_config = {
                "knowledgeBaseId": knowledge_base_id,
                "modelArn": model_arn,
                "generationConfiguration": generation_config,
                "orchestrationConfiguration": orchestration_config,
                "retrievalConfiguration": {"vectorSearchConfiguration": vector_search_config},
            }
            # Create request configuration
            request_config = {
                "input": {"text": query},
                "retrieveAndGenerateConfiguration": {
                    "type": "KNOWLEDGE_BASE",
                    "knowledgeBaseConfiguration": knowledge_base_config,
                },
            }
            # Add session configuration if provided
            if session_id and len(session_id) >= 2:
                request_config["sessionConfiguration"] = {"sessionId": session_id}
                request_config["sessionId"] = session_id
            # Send request
            response = self.bedrock_client.retrieve_and_generate(**request_config)
            # Process response
            result = {"output": response.get("output", {}).get("text", ""), "citations": []}
            # Process citations
            for citation in response.get("citations", []):
                citation_info = {
                    "text": citation.get("generatedResponsePart", {}).get("textResponsePart", {}).get("text", ""),
                    "references": [],
                }
                for ref in citation.get("retrievedReferences", []):
                    reference = {
                        "content": ref.get("content", {}).get("text", ""),
                        "metadata": ref.get("metadata", {}),
                        "location": None,
                    }
                    location = ref.get("location", {})
                    if location.get("type") == "S3":
                        reference["location"] = location.get("s3Location", {}).get("uri")
                    citation_info["references"].append(reference)
                result["citations"].append(citation_info)
            return result
        except Exception as e:
            raise Exception(f"Error calling Bedrock service: {str(e)}")
    def _invoke(
        self,
        user_id: str,
        tool_parameters: dict[str, Any],
    ) -> ToolInvokeMessage:
        """Run the tool: create the client if needed, call Bedrock, wrap the result.

        Every failure is reported as a text message rather than raised. The
        boto3 client is created on first use and then kept on
        ``self.bedrock_client``, so region and credentials from later calls
        are not re-read once a client exists.
        """
        try:
            # Create the client lazily on first use
            if not self.bedrock_client:
                region = tool_parameters.get("aws_region")
                access_key = tool_parameters.get("aws_access_key_id")
                secret_key = tool_parameters.get("aws_secret_access_key")
                boto_args = {"service_name": "bedrock-agent-runtime"}
                if region:
                    boto_args["region_name"] = region
                # Explicit credentials are used only when both halves are present
                if access_key and secret_key:
                    boto_args["aws_access_key_id"] = access_key
                    boto_args["aws_secret_access_key"] = secret_key
                try:
                    self.bedrock_client = boto3.client(**boto_args)
                except Exception as e:
                    return self.create_text_message(f"Failed to initialize Bedrock client: {str(e)}")
            # Decode the metadata filter; an empty decoded value counts as "no filter"
            metadata_filter = None
            raw_filter = tool_parameters.get("metadata_filter")
            if raw_filter:
                try:
                    metadata_filter = json.loads(raw_filter) or None
                except json.JSONDecodeError:
                    return self.create_text_message("metadata_filter must be a valid JSON string")
            try:
                # Options forwarded verbatim, with None when absent
                passthrough = (
                    "additional_model_fields",
                    "guardrail_id",
                    "guardrail_version",
                    "max_tokens",
                    "stop_sequences",
                    "temperature",
                    "top_p",
                    "prompt_template",
                    "orchestration_additional_model_fields",
                    "orchestration_max_tokens",
                    "orchestration_stop_sequences",
                    "orchestration_temperature",
                    "orchestration_top_p",
                    "orchestration_performance_mode",
                    "orchestration_prompt_template",
                    "session_id",
                )
                call_args = {name: tool_parameters.get(name) for name in passthrough}
                call_args.update(
                    # Required inputs: a missing key surfaces as an invocation error
                    query=tool_parameters["query"],
                    knowledge_base_id=tool_parameters["knowledge_base_id"],
                    model_arn=tool_parameters["model_arn"],
                    # Options that carry a default
                    performance_mode=tool_parameters.get("performance_mode", "standard"),
                    number_of_results=tool_parameters.get("number_of_results", 5),
                    search_type=tool_parameters.get("search_type", "SEMANTIC"),
                    metadata_filter=metadata_filter,
                )
                response = self._bedrock_retrieve_and_generate(**call_args)
                return self.create_json_message(response)
            except Exception as e:
                return self.create_text_message(f"Tool invocation error: {str(e)}")
        except Exception as e:
            return self.create_text_message(f"Tool execution error: {str(e)}")
    def validate_parameters(self, parameters: dict[str, Any]) -> None:
        """Check required parameters and the optional metadata filter.

        Raises:
            ValueError: If ``query``, ``model_arn`` or ``knowledge_base_id``
                is missing or empty, or if ``metadata_filter`` is present but
                is not a JSON-encoded object.
        """
        for name in ("query", "model_arn", "knowledge_base_id"):
            if not parameters.get(name):
                raise ValueError(f"{name} is required")
        raw_filter = parameters.get("metadata_filter")
        if not raw_filter:
            return
        try:
            decoded = json.loads(raw_filter)
        except json.JSONDecodeError:
            raise ValueError("metadata_filter must be a valid JSON string")
        if not isinstance(decoded, dict):
            raise ValueError("metadata_filter must be a valid JSON object")
--- a/api/core/tools/provider/builtin/aws/tools/bedrock_retrieve_and_generate.yaml
+++ b/api/core/tools/provider/builtin/aws/tools/bedrock_retrieve_and_generate.yaml
@ -0,0 +1,358 @@
 identity:
  name: bedrock_retrieve_and_generate
  author: AWS
  label:
    en_US: Bedrock Retrieve and Generate
    zh_Hans: Bedrock检索和生成
  icon: icon.svg
 description:
  human:
    en_US: A tool for retrieving and generating information using Amazon Bedrock Knowledge Base
    zh_Hans: 使用Amazon Bedrock知识库进行信息检索和生成的工具
  llm: A tool for retrieving and generating information using Amazon Bedrock Knowledge Base
 parameters:
 # Additional Configuration
  - name: session_id
    type: string
    required: false
    label:
      en_US: Session ID
      zh_Hans: 会话ID
    human_description:
      en_US: Optional session ID for continuous conversations
      zh_Hans: 用于连续对话的可选会话ID
    form: form
  # AWS Configuration
  - name: aws_region
    type: string
    required: false
    label:
      en_US: AWS Region
      zh_Hans: AWS区域
    human_description:
      en_US: AWS region for the Bedrock service
      zh_Hans: Bedrock服务的AWS区域
    form: form
  - name: aws_access_key_id
    type: string
    required: false
    label:
      en_US: AWS Access Key ID
      zh_Hans: AWS访问密钥ID
    human_description:
      en_US: AWS access key ID for authentication (optional)
      zh_Hans: 用于身份验证的AWS访问密钥ID（可选）
    form: form
  - name: aws_secret_access_key
    type: string
    required: false
    label:
      en_US: AWS Secret Access Key
      zh_Hans: AWS秘密访问密钥
    human_description:
      en_US: AWS secret access key for authentication (optional)
      zh_Hans: 用于身份验证的AWS秘密访问密钥（可选）
    form: form
  # Knowledge Base Configuration
  - name: knowledge_base_id
    type: string
    required: true
    label:
      en_US: Knowledge Base ID
      zh_Hans: 知识库ID
    human_description:
      en_US: ID of the Bedrock Knowledge Base
      zh_Hans: Bedrock知识库的ID
    form: form
  - name: model_arn
    type: string
    required: true
    label:
      en_US: Model ARN
      zh_Hans: 模型ARN
    human_description:
      en_US: The ARN of the model to use
      zh_Hans: 要使用的模型ARN
    form: form
  # Retrieval Configuration
  - name: query
    type: string
    required: true
    label:
      en_US: Query
      zh_Hans: 查询
    human_description:
      en_US: The search query to retrieve information
      zh_Hans: 用于检索信息的查询语句
    form: llm
  - name: number_of_results
    type: number
    required: false
    label:
      en_US: Number of Results
      zh_Hans: 结果数量
    human_description:
      en_US: Number of results to retrieve (1-10)
      zh_Hans: 要检索的结果数量（1-10）
    default: 5
    min: 1
    max: 10
    form: form
  - name: search_type
    type: select
    required: false
    label:
      en_US: Search Type
      zh_Hans: 搜索类型
    human_description:
      en_US: Type of search to perform
      zh_Hans: 要执行的搜索类型
    default: SEMANTIC
    options:
      - value: SEMANTIC
        label:
          en_US: Semantic Search
          zh_Hans: 语义搜索
      - value: HYBRID
        label:
          en_US: Hybrid Search
          zh_Hans: 混合搜索
    form: form
  - name: metadata_filter
    type: string
    required: false
    label:
      en_US: Metadata Filter
      zh_Hans: 元数据过滤器
    human_description:
      en_US: JSON formatted filter conditions for metadata, supporting operations like equals, greaterThan, lessThan, etc.
      zh_Hans: 元数据的JSON格式过滤条件，支持等于、大于、小于等操作
    default: "{}"
    form: form
 # Generation Configuration
  - name: guardrail_id
    type: string
    required: false
    label:
      en_US: Guardrail ID
      zh_Hans: 防护栏ID
    human_description:
      en_US: ID of the guardrail to apply
      zh_Hans: 要应用的防护栏ID
    form: form
  - name: guardrail_version
    type: string
    required: false
    label:
      en_US: Guardrail Version
      zh_Hans: 防护栏版本
    human_description:
      en_US: Version of the guardrail to apply
      zh_Hans: 要应用的防护栏版本
    form: form
  - name: max_tokens
    type: number
    required: false
    label:
      en_US: Maximum Tokens
      zh_Hans: 最大令牌数
    human_description:
      en_US: Maximum number of tokens to generate
      zh_Hans: 生成的最大令牌数
    default: 2048
    form: form
  - name: stop_sequences
    type: string
    required: false
    label:
      en_US: Stop Sequences
      zh_Hans: 停止序列
    human_description:
      en_US: JSON array of strings that will stop generation when encountered
      zh_Hans: JSON数组格式的字符串，遇到这些序列时将停止生成
    default: "[]"
    form: form
  - name: temperature
    type: number
    required: false
    label:
      en_US: Temperature
      zh_Hans: 温度
    human_description:
      en_US: Controls randomness in the output (0-1)
      zh_Hans: 控制输出的随机性（0-1）
    default: 0.7
    min: 0
    max: 1
    form: form
  - name: top_p
    type: number
    required: false
    label:
      en_US: Top P
      zh_Hans: Top P值
    human_description:
      en_US: Controls diversity via nucleus sampling (0-1)
      zh_Hans: 通过核采样控制多样性（0-1）
    default: 0.95
    min: 0
    max: 1
    form: form
  - name: performance_mode
    type: select
    required: false
    label:
      en_US: Performance Mode
      zh_Hans: 性能模式
    human_description:
      en_US: Select performance optimization mode (performanceConfig.latency)
      zh_Hans: 选择性能优化模式(performanceConfig.latency)
    default: standard
    options:
      - value: standard
        label:
          en_US: Standard
          zh_Hans: 标准
      - value: optimized
        label:
          en_US: Optimized
          zh_Hans: 优化
    form: form
  - name: prompt_template
    type: string
    required: false
    label:
      en_US: Prompt Template
      zh_Hans: 提示模板
    human_description:
      en_US: Custom prompt template for generation
      zh_Hans: 用于生成的自定义提示模板
    form: form
  - name: additional_model_fields
    type: string
    required: false
    label:
      en_US: Additional Model Fields
      zh_Hans: 额外模型字段
    human_description:
      en_US: JSON formatted additional fields for model configuration
      zh_Hans: JSON格式的额外模型配置字段
    default: "{}"
    form: form
 # Orchestration Configuration
  - name: orchestration_max_tokens
    type: number
    required: false
    label:
      en_US: Orchestration Maximum Tokens
      zh_Hans: 编排最大令牌数
    human_description:
      en_US: Maximum number of tokens for orchestration
      zh_Hans: 编排过程的最大令牌数
    default: 2048
    form: form
  - name: orchestration_stop_sequences
    type: string
    required: false
    label:
      en_US: Orchestration Stop Sequences
      zh_Hans: 编排停止序列
    human_description:
      en_US: JSON array of strings that will stop orchestration when encountered
      zh_Hans: JSON数组格式的字符串，遇到这些序列时将停止编排
    default: "[]"
    form: form
  - name: orchestration_temperature
    type: number
    required: false
    label:
      en_US: Orchestration Temperature
      zh_Hans: 编排温度
    human_description:
      en_US: Controls randomness in the orchestration output (0-1)
      zh_Hans: 控制编排输出的随机性（0-1）
    default: 0.7
    min: 0
    max: 1
    form: form
  - name: orchestration_top_p
    type: number
    required: false
    label:
      en_US: Orchestration Top P
      zh_Hans: 编排Top P值
    human_description:
      en_US: Controls diversity via nucleus sampling in orchestration (0-1)
      zh_Hans: 通过核采样控制编排的多样性（0-1）
    default: 0.95
    min: 0
    max: 1
    form: form
  - name: orchestration_performance_mode
    type: select
    required: false
    label:
      en_US: Orchestration Performance Mode
      zh_Hans: 编排性能模式
    human_description:
      en_US: Select performance optimization mode for orchestration
      zh_Hans: 选择编排的性能优化模式
    default: standard
    options:
      - value: standard
        label:
          en_US: Standard
          zh_Hans: 标准
      - value: optimized
        label:
          en_US: Optimized
          zh_Hans: 优化
    form: form
  - name: orchestration_prompt_template
    type: string
    required: false
    label:
      en_US: Orchestration Prompt Template
      zh_Hans: 编排提示模板
    human_description:
      en_US: Custom prompt template for orchestration
      zh_Hans: 用于编排的自定义提示模板
    form: form
  - name: orchestration_additional_model_fields
    type: string
    required: false
    label:
      en_US: Orchestration Additional Model Fields
      zh_Hans: 编排额外模型字段
    human_description:
      en_US: JSON formatted additional fields for orchestration model configuration
      zh_Hans: JSON格式的编排模型额外配置字段
    default: "{}"
    form: form
--- a/api/poetry.lock
+++ b/api/poetry.lock
@ -931,36 +931,36 @@ files = [
 [[package]]
 name = "boto3"
-version = "1.35.74"
+version = "1.36.4"
 description = "The AWS SDK for Python"
 optional = false
 python-versions = ">=3.8"
 groups = ["main"]
 markers = "python_version == \"3.11\" or python_version >= \"3.12\""
 files = [
-    {file = "boto3-1.35.74-py3-none-any.whl", hash = "sha256:dab5bddbbe57dc707b6f6a1f25dc2823b8e234b6fe99fafef7fc406ab73031b9"},
+    {file = "boto3-1.36.4-py3-none-any.whl", hash = "sha256:9f8f699e75ec63fcc98c4dd7290997c7c06c68d3ac8161ad4735fe71f5fe945c"},
-    {file = "boto3-1.35.74.tar.gz", hash = "sha256:88370c6845ba71a4dae7f6b357099df29b3965da584be040c8e72c9902bc9492"},
+    {file = "boto3-1.36.4.tar.gz", hash = "sha256:eeceeb74ef8b65634d358c27aa074917f4449dc828f79301f1075232618eb502"},
 ]
 [package.dependencies]
-botocore = ">=1.35.74,<1.36.0"
+botocore = ">=1.36.4,<1.37.0"
 jmespath = ">=0.7.1,<2.0.0"
-s3transfer = ">=0.10.0,<0.11.0"
+s3transfer = ">=0.11.0,<0.12.0"
 [package.extras]
 crt = ["botocore[crt] (>=1.21.0,<2.0a0)"]
 [[package]]
 name = "botocore"
-version = "1.35.94"
+version = "1.36.5"
 description = "Low-level, data-driven core of boto 3."
 optional = false
 python-versions = ">=3.8"
 groups = ["main"]
 markers = "python_version == \"3.11\" or python_version >= \"3.12\""
 files = [
-    {file = "botocore-1.35.94-py3-none-any.whl", hash = "sha256:d784d944865d8279c79d2301fc09ac28b5221d4e7328fb4e23c642c253b9932c"},
+    {file = "botocore-1.36.5-py3-none-any.whl", hash = "sha256:6d9f70afa9bf9d21407089dc22b8cc8ec6fa44866d4660858c062c74fc8555eb"},
-    {file = "botocore-1.35.94.tar.gz", hash = "sha256:2b3309b356541faa4d88bb957dcac1d8004aa44953c0b7d4521a6cc5d3d5d6ba"},
+    {file = "botocore-1.36.5.tar.gz", hash = "sha256:234ed3d29a8954c37a551c933453bf14c6ae44a69a4f273ffef377a2612ca6a6"},
 ]
 [package.dependencies]
@ -969,7 +969,7 @@ python-dateutil = ">=2.1,<3.0.0"
 urllib3 = {version = ">=1.25.4,<2.2.0 || >2.2.0,<3", markers = "python_version >= \"3.10\""}
 [package.extras]
-crt = ["awscrt (==0.22.0)"]
+crt = ["awscrt (==0.23.4)"]
 [[package]]
 name = "bottleneck"
@ -2126,7 +2126,6 @@ files = [
    {file = "cryptography-44.0.0-cp37-abi3-manylinux_2_28_aarch64.whl", hash = "sha256:761817a3377ef15ac23cd7834715081791d4ec77f9297ee694ca1ee9c2c7e5eb"},
    {file = "cryptography-44.0.0-cp37-abi3-manylinux_2_28_x86_64.whl", hash = "sha256:3c672a53c0fb4725a29c303be906d3c1fa99c32f58abe008a82705f9ee96f40b"},
    {file = "cryptography-44.0.0-cp37-abi3-manylinux_2_34_aarch64.whl", hash = "sha256:4ac4c9f37eba52cb6fbeaf5b59c152ea976726b865bd4cf87883a7e7006cc543"},
    {file = "cryptography-44.0.0-cp37-abi3-manylinux_2_34_x86_64.whl", hash = "sha256:60eb32934076fa07e4316b7b2742fa52cbb190b42c2df2863dbc4230a0a9b385"},
    {file = "cryptography-44.0.0-cp37-abi3-musllinux_1_2_aarch64.whl", hash = "sha256:ed3534eb1090483c96178fcb0f8893719d96d5274dfde98aa6add34614e97c8e"},
    {file = "cryptography-44.0.0-cp37-abi3-musllinux_1_2_x86_64.whl", hash = "sha256:f3f6fdfa89ee2d9d496e2c087cebef9d4fcbb0ad63c40e821b39f74bf48d9c5e"},
    {file = "cryptography-44.0.0-cp37-abi3-win32.whl", hash = "sha256:eb33480f1bad5b78233b0ad3e1b0be21e8ef1da745d8d2aecbb20671658b9053"},
@ -2137,7 +2136,6 @@ files = [
    {file = "cryptography-44.0.0-cp39-abi3-manylinux_2_28_aarch64.whl", hash = "sha256:c5eb858beed7835e5ad1faba59e865109f3e52b3783b9ac21e7e47dc5554e289"},
    {file = "cryptography-44.0.0-cp39-abi3-manylinux_2_28_x86_64.whl", hash = "sha256:f53c2c87e0fb4b0c00fa9571082a057e37690a8f12233306161c8f4b819960b7"},
    {file = "cryptography-44.0.0-cp39-abi3-manylinux_2_34_aarch64.whl", hash = "sha256:9e6fc8a08e116fb7c7dd1f040074c9d7b51d74a8ea40d4df2fc7aa08b76b9e6c"},
    {file = "cryptography-44.0.0-cp39-abi3-manylinux_2_34_x86_64.whl", hash = "sha256:9abcc2e083cbe8dde89124a47e5e53ec38751f0d7dfd36801008f316a127d7ba"},
    {file = "cryptography-44.0.0-cp39-abi3-musllinux_1_2_aarch64.whl", hash = "sha256:d2436114e46b36d00f8b72ff57e598978b37399d2786fd39793c36c6d5cb1c64"},
    {file = "cryptography-44.0.0-cp39-abi3-musllinux_1_2_x86_64.whl", hash = "sha256:a01956ddfa0a6790d594f5b34fc1bfa6098aca434696a03cfdbe469b8ed79285"},
    {file = "cryptography-44.0.0-cp39-abi3-win32.whl", hash = "sha256:eca27345e1214d1b9f9490d200f9db5a874479be914199194e746c893788d417"},
@ -7803,6 +7801,7 @@ files = [
    {file = "psycopg2_binary-2.9.10-cp313-cp313-musllinux_1_2_i686.whl", hash = "sha256:bb89f0a835bcfc1d42ccd5f41f04870c1b936d8507c6df12b7737febc40f0909"},
    {file = "psycopg2_binary-2.9.10-cp313-cp313-musllinux_1_2_ppc64le.whl", hash = "sha256:f0c2d907a1e102526dd2986df638343388b94c33860ff3bbe1384130828714b1"},
    {file = "psycopg2_binary-2.9.10-cp313-cp313-musllinux_1_2_x86_64.whl", hash = "sha256:f8157bed2f51db683f31306aa497311b560f2265998122abe1dce6428bd86567"},
    {file = "psycopg2_binary-2.9.10-cp313-cp313-win_amd64.whl", hash = "sha256:27422aa5f11fbcd9b18da48373eb67081243662f9b46e6fd07c3eb46e4535142"},
    {file = "psycopg2_binary-2.9.10-cp38-cp38-macosx_12_0_x86_64.whl", hash = "sha256:eb09aa7f9cecb45027683bb55aebaaf45a0df8bf6de68801a6afdc7947bb09d4"},
    {file = "psycopg2_binary-2.9.10-cp38-cp38-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:b73d6d7f0ccdad7bc43e6d34273f70d587ef62f824d7261c4ae9b8b1b6af90e8"},
    {file = "psycopg2_binary-2.9.10-cp38-cp38-manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:ce5ab4bf46a211a8e924d307c1b1fcda82368586a19d0a24f8ae166f5c784864"},
@ -9563,22 +9562,22 @@ files = [
 [[package]]
 name = "s3transfer"
-version = "0.10.4"
+version = "0.11.2"
 description = "An Amazon S3 Transfer Manager"
 optional = false
 python-versions = ">=3.8"
 groups = ["main"]
 markers = "python_version == \"3.11\" or python_version >= \"3.12\""
 files = [
-    {file = "s3transfer-0.10.4-py3-none-any.whl", hash = "sha256:244a76a24355363a68164241438de1b72f8781664920260c48465896b712a41e"},
+    {file = "s3transfer-0.11.2-py3-none-any.whl", hash = "sha256:be6ecb39fadd986ef1701097771f87e4d2f821f27f6071c872143884d2950fbc"},
-    {file = "s3transfer-0.10.4.tar.gz", hash = "sha256:29edc09801743c21eb5ecbc617a152df41d3c287f67b615f73e5f750583666a7"},
+    {file = "s3transfer-0.11.2.tar.gz", hash = "sha256:3b39185cb72f5acc77db1a58b6e25b977f28d20496b6e58d6813d75f464d632f"},
 ]
 [package.dependencies]
-botocore = ">=1.33.2,<2.0a.0"
+botocore = ">=1.36.0,<2.0a.0"
 [package.extras]
-crt = ["botocore[crt] (>=1.33.2,<2.0a.0)"]
+crt = ["botocore[crt] (>=1.36.0,<2.0a.0)"]
 [[package]]
 name = "safetensors"
@ -12248,4 +12247,4 @@ cffi = ["cffi (>=1.11)"]
 [metadata]
 lock-version = "2.1"
 python-versions = ">=3.11,<3.13"
-content-hash = "fdc2199389f0e4b6d81b4b7fe2c1d303b1995643fe802ad3a28b196e68c258ae"
+content-hash = "a8fff72e974a1bd5c28f4ae326d120410a5628ad0bc65d87adca4e943130ec8f"
--- a/api/pyproject.toml
+++ b/api/pyproject.toml
@ -21,7 +21,7 @@ azure-ai-inference = "~1.0.0b3"
 azure-ai-ml = "~1.20.0"
 azure-identity = "1.16.1"
 beautifulsoup4 = "4.12.2"
-boto3 = "1.35.74"
+boto3 = "1.36.4"
 bs4 = "~0.0.1"
 cachetools = "~5.3.0"
 celery = "~5.4.0"